{ "package": "vLLM", "version": "0.17.1", "stubs_only": "no", "py_typed": "YES", "pypi": { "upload_time": "2026-03-11T11:03:58.693896Z", "requires_python": "<3.14,>=3.10", "size": 30547577, "sha256": "d26a95dcb92e2ff78ed4b48bff247d845b0c768edf6c0acf2401376a56c57b61" }, "metadata": { "Metadata-Version": [ "2.4" ], "Name": [ "vllm" ], "Version": [ "0.17.1" ], "Summary": [ "A high-throughput and memory-efficient inference and serving engine for LLMs" ], "Author": [ "vLLM Team" ], "License-Expression": [ "Apache-2.0" ], "Project-URL": [ "Homepage, https://github.com/vllm-project/vllm", "Documentation, https://docs.vllm.ai/en/latest/", "Slack, https://slack.vllm.ai/" ], "Classifier": [ "Programming Language :: Python :: 3.10", "Programming Language :: Python :: 3.11", "Programming Language :: Python :: 3.12", "Programming Language :: Python :: 3.13", "Intended Audience :: Developers", "Intended Audience :: Information Technology", "Intended Audience :: Science/Research", "Topic :: Scientific/Engineering :: Artificial Intelligence", "Topic :: Scientific/Engineering :: Information Analysis" ], "Requires-Python": [ "<3.14,>=3.10" ], "Description-Content-Type": [ "text/markdown" ], "License-File": [ "LICENSE" ], "Requires-Dist": [ "regex", "cachetools", "psutil", "sentencepiece", "numpy", "requests>=2.26.0", "tqdm", "blake3", "py-cpuinfo", "transformers<5,>=4.56.0", "tokenizers>=0.21.1", "protobuf!=6.30.*,!=6.31.*,!=6.32.*,!=6.33.0.*,!=6.33.1.*,!=6.33.2.*,!=6.33.3.*,!=6.33.4.*,>=5.29.6", "fastapi[standard]>=0.115.0", "aiohttp>=3.13.3", "openai<2.25.0,>=1.99.1", "pydantic>=2.12.0", "prometheus_client>=0.18.0", "pillow", "prometheus-fastapi-instrumentator>=7.0.0", "tiktoken>=0.6.0", "lm-format-enforcer==0.11.3", "llguidance<1.4.0,>=1.3.0; platform_machine == \"x86_64\" or platform_machine == \"arm64\" or platform_machine == \"aarch64\" or platform_machine == \"s390x\" or platform_machine == \"ppc64le\"", "outlines_core==0.2.11", "diskcache==5.6.3", "lark==1.2.2", "xgrammar==0.1.29; platform_machine == \"x86_64\" or platform_machine == \"aarch64\" or platform_machine == \"arm64\" or platform_machine == \"s390x\" or platform_machine == \"ppc64le\"", "typing_extensions>=4.10", "filelock>=3.16.1", "partial-json-parser", "pyzmq>=25.0.0", "msgspec", "gguf>=0.17.0", "mistral_common[image]>=1.9.1", "opencv-python-headless>=4.13.0", "pyyaml", "six>=1.16.0; python_version > \"3.11\"", "setuptools<81.0.0,>=77.0.3; python_version > \"3.11\"", "einops", "compressed-tensors==0.13.0", "depyf==0.20.0", "cloudpickle", "watchfiles", "python-json-logger", "ninja", "pybase64", "cbor2", "ijson", "setproctitle", "openai-harmony>=0.0.3", "anthropic>=0.71.0", "model-hosting-container-standards<1.0.0,>=0.1.13", "mcp", "grpcio", "grpcio-reflection", "opentelemetry-sdk>=1.27.0", "opentelemetry-api>=1.27.0", "opentelemetry-exporter-otlp>=1.27.0", "opentelemetry-semantic-conventions-ai>=0.4.1", "kaldi-native-fbank>=1.18.7", "numba==0.61.2", "ray[cgraph]>=2.48.0", "torch==2.10.0", "torchaudio==2.10.0", "torchvision==0.25.0", "flashinfer-python==0.6.4", "nvidia-cudnn-frontend<1.19.0,>=1.13.0", "nvidia-cutlass-dsl>=4.4.0.dev1", "quack-kernels>=0.2.7", "pandas; extra == \"bench\"", "matplotlib; extra == \"bench\"", "seaborn; extra == \"bench\"", "datasets; extra == \"bench\"", "scipy; extra == \"bench\"", "plotly; extra == \"bench\"", "tensorizer==2.10.1; extra == \"tensorizer\"", "fastsafetensors>=0.2.2; extra == \"fastsafetensors\"", "runai-model-streamer[gcs,s3]>=0.15.3; extra == \"runai\"", "librosa; extra == \"audio\"", "scipy; extra == \"audio\"", "soundfile; extra == \"audio\"", "mistral_common[audio]; extra == \"audio\"", "petit-kernel; extra == \"petit-kernel\"", "helion; extra == \"helion\"", "opentelemetry-sdk>=1.26.0; extra == \"otel\"", "opentelemetry-api>=1.26.0; extra == \"otel\"", "opentelemetry-exporter-otlp>=1.26.0; extra == \"otel\"", "opentelemetry-semantic-conventions-ai>=0.4.1; extra == \"otel\"" ], "Provides-Extra": [ "bench", "tensorizer", "fastsafetensors", "runai", "audio", "video", "flashinfer", "petit-kernel", "helion", "otel" ], "Dynamic": [ "license-file", "provides-extra", "requires-dist" ] }, "module_reports": [ { "path": "vllm/outputs.py", "symbol_reports": [ { "kind": "class", "name": "vllm.outputs.ClassificationRequestOutput", "methods": [ { "kind": "function", "name": "ClassificationRequestOutput.from_base", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.outputs.EmbeddingRequestOutput", "methods": [ { "kind": "function", "name": "EmbeddingRequestOutput.from_base", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.outputs.PoolingRequestOutput", "methods": [ { "kind": "function", "name": "PoolingRequestOutput.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "PoolingRequestOutput.__repr__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PoolingRequestOutput.request_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PoolingRequestOutput.prompt_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PoolingRequestOutput.num_cached_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PoolingRequestOutput.finished", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PoolingRequestOutput.outputs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 5, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.outputs.CompletionOutput", "methods": [ { "kind": "function", "name": "CompletionOutput.finished", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CompletionOutput.__repr__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CompletionOutput.index", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CompletionOutput.text", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CompletionOutput.token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CompletionOutput.cumulative_logprob", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CompletionOutput.logprobs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CompletionOutput.routed_experts", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CompletionOutput.finish_reason", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CompletionOutput.stop_reason", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CompletionOutput.lora_request", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 0, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.outputs.EmbeddingOutput", "methods": [ { "kind": "function", "name": "EmbeddingOutput.from_base", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EmbeddingOutput.__repr__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "EmbeddingOutput.hidden_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "EmbeddingOutput.embedding", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 4, "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 1, "n_properties": 1 }, { "kind": "class", "name": "vllm.outputs.ClassificationOutput", "methods": [ { "kind": "function", "name": "ClassificationOutput.from_base", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ClassificationOutput.__repr__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "ClassificationOutput.num_classes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "ClassificationOutput.probs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 4, "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 1, "n_properties": 1 }, { "kind": "class", "name": "vllm.outputs.ScoringOutput", "methods": [ { "kind": "function", "name": "ScoringOutput.from_base", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ScoringOutput.__repr__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ScoringOutput.score", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.outputs.PoolingOutput", "methods": [ { "kind": "function", "name": "PoolingOutput.__repr__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PoolingOutput.__eq__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PoolingOutput.data", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.outputs.ScoringRequestOutput", "methods": [ { "kind": "function", "name": "ScoringRequestOutput.from_base", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.outputs.RequestOutput", "methods": [ { "kind": "function", "name": "RequestOutput.__init__", "n_typed": 13, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 }, { "kind": "function", "name": "RequestOutput.add", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "RequestOutput.__repr__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RequestOutput.request_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestOutput.prompt", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestOutput.prompt_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestOutput.prompt_logprobs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestOutput.outputs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestOutput.finished", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestOutput.metrics", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestOutput.lora_request", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestOutput.encoder_prompt", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestOutput.encoder_prompt_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestOutput.num_cached_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestOutput.kv_transfer_params", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 30, "n_typed": 17, "n_any": 1, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 15, "n_attrs": 12, "n_properties": 0 }, { "kind": "attr", "name": "vllm.outputs.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.outputs.STREAM_FINISHED", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.outputs", "names": [ "vllm.outputs.ClassificationOutput", "vllm.outputs.ClassificationRequestOutput", "vllm.outputs.CompletionOutput", "vllm.outputs.EmbeddingOutput", "vllm.outputs.EmbeddingRequestOutput", "vllm.outputs.PoolingOutput", "vllm.outputs.PoolingRequestOutput", "vllm.outputs.RequestOutput", "vllm.outputs.STREAM_FINISHED", "vllm.outputs.ScoringOutput", "vllm.outputs.ScoringRequestOutput", "vllm.outputs.logger" ], "n_typable": 66, "n_typed": 38, "n_any": 1, "n_untyped": 27, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 18, "n_method_overloads": 18, "n_method_params": 27, "n_classes": 10, "n_attrs": 32, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/v1/engine/async_llm.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.engine.async_llm.AsyncLLM", "methods": [ { "kind": "function", "name": "AsyncLLM.__init__", "n_typed": 14, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 }, { "kind": "function", "name": "AsyncLLM.from_vllm_config", "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "AsyncLLM.from_engine_args", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "AsyncLLM.__del__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AsyncLLM.shutdown", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AsyncLLM.get_supported_tasks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AsyncLLM.add_request", "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "AsyncLLM._add_request", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "AsyncLLM._add_streaming_input_request", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "AsyncLLM._validate_streaming_input_sampling_params", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AsyncLLM.generate", "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "AsyncLLM._run_output_handler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AsyncLLM.abort", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AsyncLLM.pause_generation", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "AsyncLLM.resume_generation", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AsyncLLM.is_paused", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AsyncLLM.encode", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "AsyncLLM.get_tokenizer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AsyncLLM.is_tracing_enabled", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AsyncLLM.do_log_stats", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AsyncLLM.check_health", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AsyncLLM.start_profile", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AsyncLLM.stop_profile", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AsyncLLM.reset_mm_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AsyncLLM.reset_prefix_cache", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AsyncLLM.reset_encoder_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AsyncLLM.sleep", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AsyncLLM.wake_up", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AsyncLLM.is_sleeping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AsyncLLM.add_lora", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AsyncLLM.remove_lora", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AsyncLLM.list_loras", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AsyncLLM.pin_lora", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AsyncLLM.collective_rpc", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "AsyncLLM.wait_for_requests_to_drain", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AsyncLLM.scale_elastic_ep", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AsyncLLM.init_weight_transfer_engine", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AsyncLLM.update_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "AsyncLLM.tokenizer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "AsyncLLM.is_running", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "AsyncLLM.is_stopped", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "AsyncLLM.errored", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "AsyncLLM.dead_error", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "AsyncLLM.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AsyncLLM.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AsyncLLM.observability_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AsyncLLM.log_requests", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AsyncLLM.log_stats", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AsyncLLM.renderer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AsyncLLM.io_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AsyncLLM.input_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AsyncLLM.output_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AsyncLLM.engine_core", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AsyncLLM.logger_manager", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AsyncLLM.output_handler", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AsyncLLM.profiler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 150, "n_typed": 131, "n_any": 0, "n_untyped": 19, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 38, "n_method_overloads": 38, "n_method_params": 94, "n_attrs": 13, "n_properties": 5 }, { "kind": "attr", "name": "vllm.v1.engine.async_llm.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.engine.async_llm.InputStreamError", "methods": [ { "kind": "function", "name": "InputStreamError.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "InputStreamError.cause", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 3, "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.engine.async_llm", "names": [ "vllm.v1.engine.async_llm.AsyncLLM", "vllm.v1.engine.async_llm.InputStreamError", "vllm.v1.engine.async_llm.logger" ], "n_typable": 154, "n_typed": 132, "n_any": 0, "n_untyped": 22, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 39, "n_method_overloads": 39, "n_method_params": 95, "n_classes": 2, "n_attrs": 15, "n_properties": 5, "n_type_ignores": 0 }, { "path": "vllm/v1/executor/ray_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.executor.ray_utils.initialize_ray_cluster", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.v1.executor.ray_utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.v1.executor.ray_utils.PG_WAIT_TIMEOUT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.v1.executor.ray_utils.get_num_tpu_nodes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.v1.executor.ray_utils.ray_import_err", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.v1.executor.ray_utils.assert_ray_available", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.v1.executor.ray_utils.ray", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.v1.executor.ray_utils.ray_is_available", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.v1.executor.ray_utils.get_num_nodes_in_placement_group", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "class", "name": "vllm.v1.executor.ray_utils.FutureWrapper", "methods": [ { "kind": "function", "name": "FutureWrapper.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FutureWrapper.result", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FutureWrapper.ref_or_refs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FutureWrapper.aggregator", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 1, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.executor.ray_utils.RayWorkerWrapper", "methods": [ { "kind": "function", "name": "RayWorkerWrapper.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "RayWorkerWrapper.get_node_ip", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RayWorkerWrapper.get_node_and_gpu_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RayWorkerWrapper.setup_device_if_necessary", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RayWorkerWrapper.execute_model_ray", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RayWorkerWrapper.override_env_vars", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RayWorkerWrapper._is_intermediate_tensors", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RayWorkerWrapper._is_last_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RayWorkerWrapper.compiled_dag_cuda_device_set", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 8, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 5, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [ { "kind": "type", "rules": null }, { "kind": "type", "rules": null } ], "name": "vllm.v1.executor.ray_utils", "names": [ "vllm.v1.executor.ray_utils.FutureWrapper", "vllm.v1.executor.ray_utils.PG_WAIT_TIMEOUT", "vllm.v1.executor.ray_utils.RayWorkerWrapper", "vllm.v1.executor.ray_utils.assert_ray_available", "vllm.v1.executor.ray_utils.get_num_nodes_in_placement_group", "vllm.v1.executor.ray_utils.get_num_tpu_nodes", "vllm.v1.executor.ray_utils.initialize_ray_cluster", "vllm.v1.executor.ray_utils.logger", "vllm.v1.executor.ray_utils.ray", "vllm.v1.executor.ray_utils.ray_import_err", "vllm.v1.executor.ray_utils.ray_is_available" ], "n_typable": 29, "n_typed": 14, "n_any": 0, "n_untyped": 15, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 2, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 8, "n_classes": 2, "n_attrs": 7, "n_properties": 0, "n_type_ignores": 2 }, { "path": "vllm/inputs/data.py", "symbol_reports": [ { "kind": "class", "name": "vllm.inputs.data.TextPrompt", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "TextPrompt.prompt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.inputs.data.PromptType", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.inputs.data.TokensPrompt", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "TokensPrompt.prompt_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TokensPrompt.prompt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TokensPrompt.token_type_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.inputs.data.SingletonInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.inputs.data.EmbedsInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "EmbedsInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EmbedsInputs.prompt_embeds", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EmbedsInputs.prompt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "function", "name": "vllm.inputs.data.embeds_inputs", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.inputs.data.DecoderOnlyInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.inputs.data.SingletonPrompt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.inputs.data.DataPrompt", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "DataPrompt.data", "n_typed": 0, "n_any": 1, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DataPrompt.data_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.inputs.data.EmbedsPrompt", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "EmbedsPrompt.prompt_embeds", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EmbedsPrompt.prompt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "function", "name": "vllm.inputs.data.token_inputs", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.inputs.data.ExplicitEncoderDecoderPrompt", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ExplicitEncoderDecoderPrompt.encoder_prompt", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ExplicitEncoderDecoderPrompt.decoder_prompt", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.inputs.data.EncoderDecoderInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "EncoderDecoderInputs.type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EncoderDecoderInputs.encoder_prompt", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EncoderDecoderInputs.decoder_prompt", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EncoderDecoderInputs.arrival_time", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.inputs.data.TokenInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "TokenInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TokenInputs.prompt_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TokenInputs.prompt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.inputs.data.ProcessorInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.inputs.data.EncoderDecoderPrompt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.inputs.data.build_enc_dec_inputs", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.inputs.data.MultiModalDataDict", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.inputs.data.MultiModalEncDecInputs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.inputs.data.DecoderInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.inputs.data.DecoderOnlyPrompt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.inputs.data.MultiModalInputs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.inputs.data.DecoderPrompt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.inputs.data.MultiModalUUIDDict", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.inputs.data.EncoderPrompt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.inputs.data.EncoderInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.inputs.data", "names": [ "vllm.inputs.data.DataPrompt", "vllm.inputs.data.DecoderInputs", "vllm.inputs.data.DecoderOnlyInputs", "vllm.inputs.data.DecoderOnlyPrompt", "vllm.inputs.data.DecoderPrompt", "vllm.inputs.data.EmbedsInputs", "vllm.inputs.data.EmbedsPrompt", "vllm.inputs.data.EncoderDecoderInputs", "vllm.inputs.data.EncoderDecoderPrompt", "vllm.inputs.data.EncoderInputs", "vllm.inputs.data.EncoderPrompt", "vllm.inputs.data.ExplicitEncoderDecoderPrompt", "vllm.inputs.data.MultiModalDataDict", "vllm.inputs.data.MultiModalEncDecInputs", "vllm.inputs.data.MultiModalInputs", "vllm.inputs.data.MultiModalUUIDDict", "vllm.inputs.data.ProcessorInputs", "vllm.inputs.data.PromptType", "vllm.inputs.data.SingletonInputs", "vllm.inputs.data.SingletonPrompt", "vllm.inputs.data.TextPrompt", "vllm.inputs.data.TokenInputs", "vllm.inputs.data.TokensPrompt", "vllm.inputs.data.build_enc_dec_inputs", "vllm.inputs.data.embeds_inputs", "vllm.inputs.data.token_inputs" ], "n_typable": 37, "n_typed": 36, "n_any": 1, "n_untyped": 0, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 9, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 8, "n_attrs": 35, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/registry.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.models.registry.ModelRegistry", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.models.registry.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.models.registry", "names": [ "vllm.model_executor.models.registry.ModelRegistry", "vllm.model_executor.models.registry.logger" ], "n_typable": 2, "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/llm.py", "symbol_reports": [ { "kind": "class", "name": "vllm.entrypoints.llm.LLM", "methods": [ { "kind": "function", "name": "LLM.__init__", "n_typed": 37, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 38, "n_params": 37, "n_function_overloads": 1, "n_function_params": 37 }, { "kind": "function", "name": "LLM.get_tokenizer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LLM.get_world_size", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LLM.reset_mm_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LLM.get_default_sampling_params", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LLM.generate", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "LLM.enqueue", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "LLM.wait_for_completion", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 3, "n_params": 2, "n_function_overloads": 2, "n_function_params": 2 }, { "kind": "function", "name": "LLM._resolve_mm_lora", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LLM.collective_rpc", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "LLM.apply_model", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LLM.beam_search", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "LLM._preprocess_cmpl", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LLM._preprocess_cmpl_one", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LLM._preprocess_chat", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "LLM._preprocess_chat_one", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "LLM.chat", "n_typed": 13, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 }, { "kind": "function", "name": "LLM.encode", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "LLM.embed", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "LLM.classify", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "LLM.reward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "LLM._embedding_score", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "LLM._late_interaction_score", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "LLM._cross_encoding_score", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "LLM.score", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "LLM.start_profile", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LLM.stop_profile", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LLM.reset_prefix_cache", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LLM.sleep", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LLM.wake_up", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LLM.get_metrics", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LLM._params_to_seq", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LLM._lora_request_to_seq", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LLM._priority_to_seq", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LLM._add_completion_requests", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "LLM._run_completion", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "LLM._run_chat", "n_typed": 13, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 }, { "kind": "function", "name": "LLM._render_and_run_requests", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "LLM._render_and_add_requests", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "LLM._add_request", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "LLM._run_engine", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LLM.init_weight_transfer_engine", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LLM.update_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LLM.__repr__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LLM.llm_engine", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LLM.engine_class", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LLM.request_counter", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LLM.default_sampling_params", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LLM.supported_tasks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LLM.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LLM.renderer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LLM.chat_template", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LLM.io_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LLM.input_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LLM.chat_template_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LLM.init_pooling_io_processors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 257, "n_typed": 240, "n_any": 1, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 44, "n_method_overloads": 45, "n_method_params": 201, "n_attrs": 12, "n_properties": 0 }, { "kind": "attr", "name": "vllm.entrypoints.llm.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.llm", "names": [ "vllm.entrypoints.llm.LLM", "vllm.entrypoints.llm.logger" ], "n_typable": 258, "n_typed": 240, "n_any": 1, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 44, "n_method_overloads": 45, "n_method_params": 201, "n_classes": 1, "n_attrs": 13, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/pooling_params.py", "symbol_reports": [ { "kind": "class", "name": "vllm.pooling_params.PoolingParams", "methods": [ { "kind": "function", "name": "PoolingParams.clone", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PoolingParams.verify", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PoolingParams._merge_default_parameters", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PoolingParams._verify_step_pooling", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PoolingParams._set_default_parameters", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PoolingParams._verify_valid_parameters", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PoolingParams.__repr__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PoolingParams.__post_init__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "PoolingParams.all_parameters", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "PoolingParams.valid_parameters", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "PoolingParams.use_activation", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PoolingParams.dimensions", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PoolingParams.step_tag_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PoolingParams.returned_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PoolingParams.task", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PoolingParams.requires_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PoolingParams.skip_reading_prefix_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PoolingParams.extra_kwargs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PoolingParams.output_kind", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 24, "n_typed": 20, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 5, "n_attrs": 9, "n_properties": 2 } ], "type_ignores": [ { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] } ], "name": "vllm.pooling_params", "names": [ "vllm.pooling_params.PoolingParams" ], "n_typable": 24, "n_typed": 20, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 5, "n_classes": 1, "n_attrs": 9, "n_properties": 2, "n_type_ignores": 2 }, { "path": "vllm/version.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.version.__version__", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.version.__version_tuple__", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.version", "names": [ "vllm.version.__version__", "vllm.version.__version_tuple__" ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/sampling_params.py", "symbol_reports": [ { "kind": "class", "name": "vllm.sampling_params.SamplingParams", "methods": [ { "kind": "function", "name": "SamplingParams.from_optional", "n_typed": 29, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 29, "n_params": 28, "n_function_overloads": 1, "n_function_params": 28 }, { "kind": "function", "name": "SamplingParams.__post_init__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SamplingParams._verify_args", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SamplingParams._verify_greedy_sampling", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SamplingParams.update_from_generation_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SamplingParams.update_from_tokenizer", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SamplingParams.clone", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SamplingParams.verify", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "SamplingParams._validate_logprobs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SamplingParams._validate_logit_bias", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SamplingParams._validate_logits_processors", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SamplingParams._validate_allowed_token_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SamplingParams._validate_spec_decode", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SamplingParams._validate_structured_outputs", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SamplingParams.__repr__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SamplingParams.for_sampler_warmup", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "SamplingParams.sampling_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "SamplingParams.eos_token_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "SamplingParams.all_stop_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "SamplingParams.bad_words_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "SamplingParams.n", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.presence_penalty", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.frequency_penalty", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.repetition_penalty", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.temperature", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.top_p", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.top_k", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.min_p", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.seed", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.stop", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.stop_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.ignore_eos", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.max_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.min_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.logprobs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.prompt_logprobs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.flat_logprobs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.detokenize", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.skip_special_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.spaces_between_special_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.include_stop_str_in_output", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.output_kind", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.skip_clone", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.output_text_buffer_length", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams._eos_token_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams._all_stop_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.structured_outputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.logit_bias", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.allowed_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.extra_args", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.bad_words", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams._bad_words_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.skip_reading_prefix_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.repetition_detection", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 96, "n_typed": 96, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 16, "n_method_overloads": 16, "n_method_params": 42, "n_attrs": 34, "n_properties": 4 }, { "kind": "class", "name": "vllm.sampling_params.RequestOutputKind", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "RequestOutputKind.CUMULATIVE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RequestOutputKind.DELTA", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RequestOutputKind.FINAL_ONLY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.sampling_params.SamplingType", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "SamplingType.GREEDY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SamplingType.RANDOM", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SamplingType.RANDOM_SEED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.sampling_params.BeamSearchParams", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "BeamSearchParams.beam_width", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BeamSearchParams.max_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BeamSearchParams.ignore_eos", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BeamSearchParams.temperature", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BeamSearchParams.length_penalty", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BeamSearchParams.include_stop_str_in_output", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.sampling_params.StructuredOutputsParams", "methods": [ { "kind": "function", "name": "StructuredOutputsParams.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "StructuredOutputsParams.all_constraints_none", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "StructuredOutputsParams.all_non_structural_tag_constraints_none", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "StructuredOutputsParams.json", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StructuredOutputsParams.regex", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StructuredOutputsParams.choice", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StructuredOutputsParams.grammar", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StructuredOutputsParams.json_object", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StructuredOutputsParams.disable_fallback", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StructuredOutputsParams.disable_any_whitespace", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StructuredOutputsParams.disable_additional_properties", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StructuredOutputsParams.whitespace_pattern", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StructuredOutputsParams.structural_tag", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StructuredOutputsParams._backend", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StructuredOutputsParams._backend_was_auto", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 0, "n_attrs": 12, "n_properties": 0 }, { "kind": "attr", "name": "vllm.sampling_params.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.sampling_params.RepetitionDetectionParams", "methods": [ { "kind": "function", "name": "RepetitionDetectionParams.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RepetitionDetectionParams.max_pattern_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RepetitionDetectionParams.min_pattern_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RepetitionDetectionParams.min_count", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [ { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] } ], "name": "vllm.sampling_params", "names": [ "vllm.sampling_params.BeamSearchParams", "vllm.sampling_params.RepetitionDetectionParams", "vllm.sampling_params.RequestOutputKind", "vllm.sampling_params.SamplingParams", "vllm.sampling_params.SamplingType", "vllm.sampling_params.StructuredOutputsParams", "vllm.sampling_params.logger" ], "n_typable": 107, "n_typed": 104, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 20, "n_method_overloads": 20, "n_method_params": 42, "n_classes": 6, "n_attrs": 62, "n_properties": 4, "n_type_ignores": 4 }, { "path": "vllm/v1/engine/llm_engine.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.engine.llm_engine.LLMEngine", "methods": [ { "kind": "function", "name": "LLMEngine.__init__", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "LLMEngine.from_vllm_config", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "LLMEngine.from_engine_args", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "LLMEngine.get_num_unfinished_requests", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LLMEngine.has_unfinished_requests", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LLMEngine.has_unfinished_requests_dp", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LLMEngine.get_supported_tasks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LLMEngine.abort_request", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LLMEngine.add_request", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "LLMEngine.step", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LLMEngine.start_profile", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LLMEngine.stop_profile", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LLMEngine.reset_mm_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LLMEngine.reset_prefix_cache", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LLMEngine.reset_encoder_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LLMEngine.sleep", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LLMEngine.wake_up", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LLMEngine.is_sleeping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LLMEngine.get_metrics", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LLMEngine.get_tokenizer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LLMEngine.do_log_stats", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LLMEngine.do_log_stats_with_interval", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LLMEngine.add_lora", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LLMEngine.remove_lora", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LLMEngine.list_loras", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LLMEngine.pin_lora", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LLMEngine.collective_rpc", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "LLMEngine.apply_model", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LLMEngine.__del__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "LLMEngine.tokenizer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "LLMEngine.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LLMEngine.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LLMEngine.observability_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LLMEngine.log_stats", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LLMEngine.external_launcher_dp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LLMEngine.should_execute_dummy_batch", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LLMEngine.renderer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LLMEngine.io_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LLMEngine.input_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LLMEngine.output_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LLMEngine.engine_core", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LLMEngine.logger_manager", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LLMEngine.dp_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LLMEngine.model_executor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 87, "n_typed": 68, "n_any": 0, "n_untyped": 19, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 29, "n_method_overloads": 29, "n_method_params": 43, "n_attrs": 14, "n_properties": 1 }, { "kind": "attr", "name": "vllm.v1.engine.llm_engine.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.v1.engine.llm_engine", "names": [ "vllm.v1.engine.llm_engine.LLMEngine", "vllm.v1.engine.llm_engine.logger" ], "n_typable": 88, "n_typed": 68, "n_any": 0, "n_untyped": 20, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 29, "n_method_overloads": 29, "n_method_params": 43, "n_classes": 1, "n_attrs": 15, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/engine/arg_utils.py", "symbol_reports": [ { "kind": "class", "name": "vllm.engine.arg_utils.EngineArgs", "methods": [ { "kind": "function", "name": "EngineArgs.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineArgs.add_cli_args", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EngineArgs.from_cli_args", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EngineArgs.create_model_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineArgs.validate_tensorizer_args", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineArgs.create_load_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineArgs.create_speculative_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EngineArgs.create_engine_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EngineArgs._check_feature_supported", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineArgs.get_batch_defaults", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EngineArgs._set_default_chunked_prefill_and_prefix_caching_args", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EngineArgs._set_default_max_num_seqs_and_batched_tokens_args", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EngineArgs.model", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.enable_return_routed_experts", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.model_weights", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.served_model_name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.hf_config_path", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.runner", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.convert", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.skip_tokenizer_init", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.enable_prompt_embeds", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.tokenizer_mode", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.trust_remote_code", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.allowed_local_media_path", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.allowed_media_domains", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.download_dir", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.safetensors_load_strategy", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.load_format", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.config_format", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.kv_cache_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.seed", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.max_model_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.cudagraph_capture_sizes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.max_cudagraph_capture_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.distributed_executor_backend", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.pipeline_parallel_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.master_addr", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.master_port", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.nnodes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.node_rank", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.tensor_parallel_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.prefill_context_parallel_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.decode_context_parallel_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.dcp_kv_cache_interleave_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.cp_kv_cache_interleave_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.data_parallel_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.data_parallel_rank", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.data_parallel_start_rank", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.data_parallel_size_local", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.data_parallel_address", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.data_parallel_rpc_port", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.data_parallel_hybrid_lb", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.data_parallel_external_lb", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.data_parallel_backend", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.enable_expert_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.moe_backend", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.all2all_backend", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.enable_elastic_ep", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.enable_dbo", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.ubatch_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.dbo_decode_token_threshold", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.dbo_prefill_token_threshold", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.disable_nccl_for_dp_synchronization", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.eplb_config", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.enable_eplb", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.expert_placement_strategy", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs._api_process_count", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs._api_process_rank", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.max_parallel_loading_workers", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.block_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.enable_prefix_caching", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.prefix_caching_hash_algo", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.disable_sliding_window", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.disable_cascade_attn", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.swap_space", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.offload_backend", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.cpu_offload_gb", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.cpu_offload_params", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.offload_group_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.offload_num_in_group", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.offload_prefetch_step", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.offload_params", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.gpu_memory_utilization", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.kv_cache_memory_bytes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.max_num_batched_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.max_num_partial_prefills", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.max_long_partial_prefills", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.long_prefill_token_threshold", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.max_num_seqs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.max_logprobs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.logprobs_mode", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.disable_log_stats", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.aggregate_engine_logging", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.revision", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.code_revision", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.hf_token", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.hf_overrides", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.tokenizer_revision", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.quantization", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.allow_deprecated_quantization", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.enforce_eager", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.disable_custom_all_reduce", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.language_model_only", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.limit_mm_per_prompt", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.enable_mm_embeds", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.interleave_mm_strings", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.media_io_kwargs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.mm_processor_kwargs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.mm_processor_cache_gb", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.mm_processor_cache_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.mm_shm_cache_max_object_size_mb", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.mm_encoder_only", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.mm_encoder_tp_mode", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.mm_encoder_attn_backend", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.io_processor_plugin", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.skip_mm_profiling", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.video_pruning_rate", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.enable_lora", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.max_loras", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.max_lora_rank", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.default_mm_loras", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.fully_sharded_loras", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.max_cpu_loras", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.lora_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.enable_tower_connector_lora", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.specialize_active_lora", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.ray_workers_use_nsight", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.num_gpu_blocks_override", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.model_loader_extra_config", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.ignore_patterns", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.enable_chunked_prefill", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.disable_chunked_mm_input", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.disable_hybrid_kv_cache_manager", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.structured_outputs_config", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.reasoning_parser", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.reasoning_parser_plugin", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.speculative_config", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.show_hidden_metrics_for_version", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.otlp_traces_endpoint", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.collect_detailed_traces", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.kv_cache_metrics", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.kv_cache_metrics_sample", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.cudagraph_metrics", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.enable_layerwise_nvtx_tracing", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.enable_mfu_metrics", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.enable_logging_iteration_details", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.enable_mm_processor_stats", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.scheduling_policy", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.scheduler_cls", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.pooler_config", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.compilation_config", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.attention_config", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.kernel_config", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.enable_flashinfer_autotune", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.worker_cls", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.worker_extension_cls", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.profiler_config", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.kv_transfer_config", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.kv_events_config", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.ec_transfer_config", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.generation_config", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.enable_sleep_mode", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.override_generation_config", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.model_impl", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.override_attention_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.attention_backend", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.calculate_kv_scales", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.mamba_cache_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.mamba_ssm_cache_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.mamba_block_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.mamba_cache_mode", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.additional_config", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.use_tqdm_on_load", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.pt_load_map_location", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.logits_processors", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.async_scheduling", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.stream_interval", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.kv_sharing_fast_prefill", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.optimization_level", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.performance_mode", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.kv_offloading_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.kv_offloading_backend", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.tokens_only", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.weight_transfer_config", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineArgs.fail_on_environ_validation", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 22, "n_typed": 17, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 10, "n_attrs": 175, "n_properties": 0 }, { "kind": "class", "name": "vllm.engine.arg_utils.AsyncEngineArgs", "methods": [ { "kind": "function", "name": "AsyncEngineArgs.add_cli_args", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AsyncEngineArgs.enable_log_requests", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.engine.arg_utils.is_not_builtin", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.engine.arg_utils.collection_to_kwargs", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.engine.arg_utils.optional_type", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.engine.arg_utils.is_type", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.engine.arg_utils.TypeHintT", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.engine.arg_utils.parse_type", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.engine.arg_utils.NEEDS_HELP", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.engine.arg_utils.union_dict_and_str", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.engine.arg_utils.get_kwargs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.engine.arg_utils.T", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.engine.arg_utils.get_type_hints", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.engine.arg_utils.get_type", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.engine.arg_utils.TypeHint", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.engine.arg_utils.human_readable_int_or_auto", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.engine.arg_utils.literal_to_kwargs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.engine.arg_utils.human_readable_int", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.engine.arg_utils.contains_type", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.engine.arg_utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.engine.arg_utils", "names": [ "vllm.engine.arg_utils.AsyncEngineArgs", "vllm.engine.arg_utils.EngineArgs", "vllm.engine.arg_utils.NEEDS_HELP", "vllm.engine.arg_utils.T", "vllm.engine.arg_utils.TypeHint", "vllm.engine.arg_utils.TypeHintT", "vllm.engine.arg_utils.collection_to_kwargs", "vllm.engine.arg_utils.contains_type", "vllm.engine.arg_utils.get_kwargs", "vllm.engine.arg_utils.get_type", "vllm.engine.arg_utils.get_type_hints", "vllm.engine.arg_utils.human_readable_int", "vllm.engine.arg_utils.human_readable_int_or_auto", "vllm.engine.arg_utils.is_not_builtin", "vllm.engine.arg_utils.is_type", "vllm.engine.arg_utils.literal_to_kwargs", "vllm.engine.arg_utils.logger", "vllm.engine.arg_utils.optional_type", "vllm.engine.arg_utils.parse_type", "vllm.engine.arg_utils.union_dict_and_str" ], "n_typable": 59, "n_typed": 52, "n_any": 0, "n_untyped": 7, "n_functions": 13, "n_function_overloads": 13, "n_function_params": 17, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 12, "n_classes": 2, "n_attrs": 181, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/assets/audio.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.assets.audio.ASSET_DIR", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.assets.audio.AudioAssetName", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.assets.audio.AudioAsset", "methods": [ { "kind": "function", "name": "AudioAsset.get_local_path", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "AudioAsset.filename", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "AudioAsset.audio_and_sample_rate", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "AudioAsset.url", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "AudioAsset.name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 1, "n_properties": 3 }, { "kind": "attr", "name": "vllm.assets.audio.librosa", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [ { "kind": "type", "rules": [ "assignment" ] } ], "name": "vllm.assets.audio", "names": [ "vllm.assets.audio.ASSET_DIR", "vllm.assets.audio.AudioAsset", "vllm.assets.audio.AudioAssetName", "vllm.assets.audio.librosa" ], "n_typable": 6, "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_classes": 1, "n_attrs": 4, "n_properties": 3, "n_type_ignores": 1 }, { "path": "vllm/assets/base.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.assets.base.VLLM_S3_BUCKET_URL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.assets.base.get_cache_dir", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.assets.base.get_vllm_public_assets", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.assets.base", "names": [ "vllm.assets.base.VLLM_S3_BUCKET_URL", "vllm.assets.base.get_cache_dir", "vllm.assets.base.get_vllm_public_assets" ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 2, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/assets/image.py", "symbol_reports": [ { "kind": "class", "name": "vllm.assets.image.ImageAsset", "methods": [ { "kind": "function", "name": "ImageAsset.get_path", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ImageAsset.pil_image_ext", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ImageAsset.read_bytes", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "ImageAsset.pil_image", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ImageAsset.image_embeds", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "ImageAsset.name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 8, "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_attrs": 1, "n_properties": 2 }, { "kind": "attr", "name": "vllm.assets.image.VLM_IMAGES_DIR", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.assets.image.ImageAssetName", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.assets.image", "names": [ "vllm.assets.image.ImageAsset", "vllm.assets.image.ImageAssetName", "vllm.assets.image.VLM_IMAGES_DIR" ], "n_typable": 9, "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_classes": 1, "n_attrs": 3, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/assets/video.py", "symbol_reports": [ { "kind": "function", "name": "vllm.assets.video.download_video_asset", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.assets.video.video_to_ndarrays", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.assets.video.video_to_pil_images_list", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.assets.video.video_get_metadata", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.assets.video.VideoAssetName", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.assets.video.VideoAsset", "methods": [ { "kind": "function", "name": "VideoAsset.get_audio", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "VideoAsset.filename", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "VideoAsset.video_path", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "VideoAsset.pil_images", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "VideoAsset.np_ndarrays", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "VideoAsset.metadata", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "VideoAsset.name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VideoAsset.num_frames", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VideoAsset._NAME_TO_FILE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 3, "n_properties": 5 }, { "kind": "attr", "name": "vllm.assets.video.librosa", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [ { "kind": "type", "rules": [ "assignment" ] } ], "name": "vllm.assets.video", "names": [ "vllm.assets.video.VideoAsset", "vllm.assets.video.VideoAssetName", "vllm.assets.video.download_video_asset", "vllm.assets.video.librosa", "vllm.assets.video.video_get_metadata", "vllm.assets.video.video_to_ndarrays", "vllm.assets.video.video_to_pil_images_list" ], "n_typable": 20, "n_typed": 19, "n_any": 0, "n_untyped": 1, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 7, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_classes": 1, "n_attrs": 5, "n_properties": 5, "n_type_ignores": 1 }, { "path": "vllm/beam_search.py", "symbol_reports": [ { "kind": "class", "name": "vllm.beam_search.BeamSearchSequence", "methods": [ { "kind": "function", "name": "BeamSearchSequence.get_prompt", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BeamSearchSequence.orig_prompt", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BeamSearchSequence.tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BeamSearchSequence.logprobs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BeamSearchSequence.lora_request", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BeamSearchSequence.cum_logprob", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BeamSearchSequence.text", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BeamSearchSequence.finish_reason", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BeamSearchSequence.stop_reason", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.beam_search.BeamSearchInstance", "methods": [ { "kind": "function", "name": "BeamSearchInstance.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BeamSearchInstance.beams", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BeamSearchInstance.completed", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 7, "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 4, "n_attrs": 2, "n_properties": 0 }, { "kind": "function", "name": "vllm.beam_search.get_beam_search_score", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.beam_search.create_sort_beams_key_function", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.beam_search.BeamSearchOutput", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "BeamSearchOutput.sequences", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.beam_search", "names": [ "vllm.beam_search.BeamSearchInstance", "vllm.beam_search.BeamSearchOutput", "vllm.beam_search.BeamSearchSequence", "vllm.beam_search.create_sort_beams_key_function", "vllm.beam_search.get_beam_search_score" ], "n_typable": 16, "n_typed": 12, "n_any": 0, "n_untyped": 4, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 6, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_classes": 3, "n_attrs": 11, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/collect_env.py", "symbol_reports": [ { "kind": "function", "name": "vllm.collect_env.get_cudnn_version", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.collect_env.get_python_platform", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.collect_env.get_cachingallocator_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.collect_env.get_platform", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.collect_env.get_os", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.collect_env.get_cpu_info", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.collect_env.get_gpu_info", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.collect_env.get_nvidia_driver_version", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.collect_env.check_release_file", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.collect_env.DEFAULT_CONDA_PATTERNS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.collect_env.get_env_info", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.collect_env.get_lsb_version", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.collect_env.run", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.collect_env.get_windows_version", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.collect_env.get_running_cuda_version", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.collect_env.get_cmake_version", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.collect_env.TORCH_AVAILABLE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.collect_env.get_cuda_module_loading_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.collect_env.get_clang_version", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.collect_env.SystemEnv", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.collect_env.is_uv_venv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.collect_env.get_rocm_version", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.collect_env.get_mac_version", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.collect_env.pretty_str", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.collect_env.get_gpu_topo", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.collect_env.summarize_vllm_build_flags", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.collect_env.get_env_vars", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.collect_env.is_xnnpack_available", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.collect_env.run_and_read_all", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.collect_env.get_vllm_version", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.collect_env.env_info_fmt", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.collect_env.main", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.collect_env.get_conda_packages", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.collect_env.DEFAULT_PIP_PATTERNS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.collect_env.get_pip_packages", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.collect_env.get_pretty_env_info", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.collect_env.run_and_parse_first_match", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.collect_env.get_libc_version", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.collect_env.get_gcc_version", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.collect_env.get_nvidia_smi", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "type_ignores": [], "name": "vllm.collect_env", "names": [ "vllm.collect_env.DEFAULT_CONDA_PATTERNS", "vllm.collect_env.DEFAULT_PIP_PATTERNS", "vllm.collect_env.SystemEnv", "vllm.collect_env.TORCH_AVAILABLE", "vllm.collect_env.check_release_file", "vllm.collect_env.env_info_fmt", "vllm.collect_env.get_cachingallocator_config", "vllm.collect_env.get_clang_version", "vllm.collect_env.get_cmake_version", "vllm.collect_env.get_conda_packages", "vllm.collect_env.get_cpu_info", "vllm.collect_env.get_cuda_module_loading_config", "vllm.collect_env.get_cudnn_version", "vllm.collect_env.get_env_info", "vllm.collect_env.get_env_vars", "vllm.collect_env.get_gcc_version", "vllm.collect_env.get_gpu_info", "vllm.collect_env.get_gpu_topo", "vllm.collect_env.get_libc_version", "vllm.collect_env.get_lsb_version", "vllm.collect_env.get_mac_version", "vllm.collect_env.get_nvidia_driver_version", "vllm.collect_env.get_nvidia_smi", "vllm.collect_env.get_os", "vllm.collect_env.get_pip_packages", "vllm.collect_env.get_platform", "vllm.collect_env.get_pretty_env_info", "vllm.collect_env.get_python_platform", "vllm.collect_env.get_rocm_version", "vllm.collect_env.get_running_cuda_version", "vllm.collect_env.get_vllm_version", "vllm.collect_env.get_windows_version", "vllm.collect_env.is_uv_venv", "vllm.collect_env.is_xnnpack_available", "vllm.collect_env.main", "vllm.collect_env.pretty_str", "vllm.collect_env.run", "vllm.collect_env.run_and_parse_first_match", "vllm.collect_env.run_and_read_all", "vllm.collect_env.summarize_vllm_build_flags" ], "n_typable": 62, "n_typed": 0, "n_any": 0, "n_untyped": 62, "n_functions": 35, "n_function_overloads": 35, "n_function_params": 26, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 5, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/compilation/backends.py", "symbol_reports": [ { "kind": "class", "name": "vllm.compilation.backends.PiecewiseCompileInterpreter", "methods": [ { "kind": "function", "name": "PiecewiseCompileInterpreter.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "PiecewiseCompileInterpreter.run", "n_typed": 0, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PiecewiseCompileInterpreter.call_module", "n_typed": 3, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PiecewiseCompileInterpreter.fake_mode", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PiecewiseCompileInterpreter.compile_submod_names", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PiecewiseCompileInterpreter.compilation_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PiecewiseCompileInterpreter.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PiecewiseCompileInterpreter.vllm_backend", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PiecewiseCompileInterpreter.extra_traceback", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 8, "n_any": 3, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 8, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.backends.VllmBackend", "methods": [ { "kind": "function", "name": "VllmBackend.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "VllmBackend.collect_standalone_compile_artifacts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "VllmBackend.configure_post_pass", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "VllmBackend._log_compilation_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "VllmBackend.__call__", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "VllmBackend.vllm_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VllmBackend.compilation_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VllmBackend._called", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VllmBackend.graph", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VllmBackend.split_gm", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VllmBackend.piecewise_graphs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VllmBackend.returned_callable", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VllmBackend.post_grad_passes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VllmBackend.compiler_manager", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VllmBackend.inductor_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VllmBackend.prefix", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VllmBackend.is_encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VllmBackend.pass_manager", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VllmBackend.pass_key", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 24, "n_typed": 18, "n_any": 1, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 5, "n_attrs": 14, "n_properties": 0 }, { "kind": "attr", "name": "vllm.compilation.backends.compilation_start_time", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.compilation.backends.StopCompiling", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.compilation.backends.wrap_with_cudagraph_if_needed", "n_typed": 4, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.compilation.backends.make_copy_and_call", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.compilation.backends.set_on_compilation_complete", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.compilation.backends.SplitItem", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "SplitItem.submod_name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SplitItem.graph_id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SplitItem.is_splitting_graph", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SplitItem.graph", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "function", "name": "vllm.compilation.backends.split_graph", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.compilation.backends.model_tag", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.compilation.backends.make_compiler", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.compilation.backends.model_is_encoder", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.compilation.backends.set_model_tag", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.compilation.backends.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.compilation.backends.CompilerManager", "methods": [ { "kind": "function", "name": "CompilerManager.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompilerManager.compute_hash", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompilerManager.compile_context", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompilerManager.initialize_cache", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "CompilerManager.save_to_file", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CompilerManager.load", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "CompilerManager.compile", "n_typed": 7, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CompilerManager.cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompilerManager.is_cache_updated", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompilerManager.compilation_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompilerManager.compiler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompilerManager.loaded_artifacts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 29, "n_typed": 25, "n_any": 1, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 17, "n_attrs": 5, "n_properties": 0 } ], "type_ignores": [ { "kind": "type", "rules": [ "misc" ] } ], "name": "vllm.compilation.backends", "names": [ "vllm.compilation.backends.CompilerManager", "vllm.compilation.backends.PiecewiseCompileInterpreter", "vllm.compilation.backends.SplitItem", "vllm.compilation.backends.StopCompiling", "vllm.compilation.backends.VllmBackend", "vllm.compilation.backends.compilation_start_time", "vllm.compilation.backends.logger", "vllm.compilation.backends.make_compiler", "vllm.compilation.backends.make_copy_and_call", "vllm.compilation.backends.model_is_encoder", "vllm.compilation.backends.model_tag", "vllm.compilation.backends.set_model_tag", "vllm.compilation.backends.set_on_compilation_complete", "vllm.compilation.backends.split_graph", "vllm.compilation.backends.wrap_with_cudagraph_if_needed" ], "n_typable": 93, "n_typed": 71, "n_any": 7, "n_untyped": 15, "n_functions": 6, "n_function_overloads": 6, "n_function_params": 14, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 30, "n_classes": 5, "n_attrs": 33, "n_properties": 0, "n_type_ignores": 1 }, { "path": "vllm/compilation/base_static_graph.py", "symbol_reports": [ { "kind": "class", "name": "vllm.compilation.base_static_graph.AbstractStaticGraphWrapper", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.compilation.base_static_graph", "names": [ "vllm.compilation.base_static_graph.AbstractStaticGraphWrapper" ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/compilation/caching.py", "symbol_reports": [ { "kind": "function", "name": "vllm.compilation.caching.patch_pytree_map_over_slice", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.compilation.caching.SerializableCallable", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.compilation.caching.VllmSerializableFunction", "methods": [ { "kind": "function", "name": "VllmSerializableFunction.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "VllmSerializableFunction.__call__", "n_typed": 0, "n_any": 3, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VllmSerializableFunction.serialize_compile_artifacts", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "VllmSerializableFunction.deserialize_compile_artifacts", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "VllmSerializableFunction.co_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "VllmSerializableFunction.graph_module", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VllmSerializableFunction.example_inputs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VllmSerializableFunction.prefix", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VllmSerializableFunction.optimized_call", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VllmSerializableFunction.is_encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VllmSerializableFunction.shape_env", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VllmSerializableFunction.vllm_backend", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VllmSerializableFunction.sym_tensor_indices", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 24, "n_typed": 13, "n_any": 3, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 11, "n_attrs": 8, "n_properties": 1 }, { "kind": "function", "name": "vllm.compilation.caching.reconstruct_serializable_fn_from_mega_artifact", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "class", "name": "vllm.compilation.caching.StandaloneCompiledArtifacts", "methods": [ { "kind": "function", "name": "StandaloneCompiledArtifacts.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "StandaloneCompiledArtifacts.insert", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "StandaloneCompiledArtifacts.get", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StandaloneCompiledArtifacts.get_loaded", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StandaloneCompiledArtifacts.size_bytes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "StandaloneCompiledArtifacts.num_artifacts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "StandaloneCompiledArtifacts.num_entries", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "StandaloneCompiledArtifacts.submodule_names", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "StandaloneCompiledArtifacts.load_all", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "StandaloneCompiledArtifacts.__getstate__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "StandaloneCompiledArtifacts.__setstate__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "StandaloneCompiledArtifacts.submodule_bytes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "StandaloneCompiledArtifacts.submodule_bytes_store", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "StandaloneCompiledArtifacts.loaded_submodule_store", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 22, "n_typed": 21, "n_any": 1, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 8, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.compilation.caching.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.compilation.caching.aot_compile_hash_factors", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [ { "kind": "type", "rules": [ "misc" ] } ], "name": "vllm.compilation.caching", "names": [ "vllm.compilation.caching.SerializableCallable", "vllm.compilation.caching.StandaloneCompiledArtifacts", "vllm.compilation.caching.VllmSerializableFunction", "vllm.compilation.caching.aot_compile_hash_factors", "vllm.compilation.caching.logger", "vllm.compilation.caching.patch_pytree_map_over_slice", "vllm.compilation.caching.reconstruct_serializable_fn_from_mega_artifact" ], "n_typable": 56, "n_typed": 42, "n_any": 4, "n_untyped": 10, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 6, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 19, "n_classes": 2, "n_attrs": 13, "n_properties": 1, "n_type_ignores": 1 }, { "path": "vllm/compilation/compiler_interface.py", "symbol_reports": [ { "kind": "class", "name": "vllm.compilation.compiler_interface.CompilerInterface", "methods": [ { "kind": "function", "name": "CompilerInterface.initialize_cache", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "CompilerInterface.compute_hash", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompilerInterface.compile", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "CompilerInterface.load", "n_typed": 5, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CompilerInterface.name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 19, "n_typed": 18, "n_any": 1, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 14, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.compilation.compiler_interface.is_compile_cache_enabled", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.compilation.compiler_interface.InductorAdaptor", "methods": [ { "kind": "function", "name": "InductorAdaptor.compute_hash", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InductorAdaptor.initialize_cache", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "InductorAdaptor.compile", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "InductorAdaptor.load", "n_typed": 5, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "InductorAdaptor.metrics_context", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "InductorAdaptor.name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 19, "n_typed": 18, "n_any": 1, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 14, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.compilation.compiler_interface.set_functorch_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "class", "name": "vllm.compilation.compiler_interface.InductorStandaloneAdaptor", "methods": [ { "kind": "function", "name": "InductorStandaloneAdaptor.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InductorStandaloneAdaptor.compute_hash", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InductorStandaloneAdaptor.initialize_cache", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "InductorStandaloneAdaptor.compile", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "InductorStandaloneAdaptor.load", "n_typed": 5, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "InductorStandaloneAdaptor.name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "InductorStandaloneAdaptor.save_format", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 19, "n_any": 1, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 15, "n_attrs": 2, "n_properties": 0 }, { "kind": "function", "name": "vllm.compilation.compiler_interface.set_inductor_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.compilation.compiler_interface.get_inductor_factors", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.compilation.compiler_interface.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.compilation.compiler_interface.EagerAdaptor", "methods": [ { "kind": "function", "name": "EagerAdaptor.compile", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EagerAdaptor.name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 5, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.compiler_interface.AlwaysHitShapeEnv", "methods": [ { "kind": "function", "name": "AlwaysHitShapeEnv.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AlwaysHitShapeEnv.evaluate_guards_expression", "n_typed": 1, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AlwaysHitShapeEnv.get_pruned_guards", "n_typed": 1, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AlwaysHitShapeEnv.produce_guards_expression", "n_typed": 1, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AlwaysHitShapeEnv.guards", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 11, "n_typed": 5, "n_any": 6, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 6, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.compilation.compiler_interface", "names": [ "vllm.compilation.compiler_interface.AlwaysHitShapeEnv", "vllm.compilation.compiler_interface.CompilerInterface", "vllm.compilation.compiler_interface.EagerAdaptor", "vllm.compilation.compiler_interface.InductorAdaptor", "vllm.compilation.compiler_interface.InductorStandaloneAdaptor", "vllm.compilation.compiler_interface.get_inductor_factors", "vllm.compilation.compiler_interface.is_compile_cache_enabled", "vllm.compilation.compiler_interface.logger", "vllm.compilation.compiler_interface.set_functorch_config", "vllm.compilation.compiler_interface.set_inductor_config" ], "n_typable": 84, "n_typed": 73, "n_any": 9, "n_untyped": 2, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 3, "n_methods": 19, "n_method_overloads": 19, "n_method_params": 54, "n_classes": 5, "n_attrs": 7, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/compilation/counter.py", "symbol_reports": [ { "kind": "class", "name": "vllm.compilation.counter.CompilationCounter", "methods": [ { "kind": "function", "name": "CompilationCounter.clone", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CompilationCounter.expect", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CompilationCounter.num_models_seen", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CompilationCounter.num_graphs_seen", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CompilationCounter.num_piecewise_graphs_seen", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CompilationCounter.num_piecewise_capturable_graphs_seen", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CompilationCounter.num_backend_compilations", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CompilationCounter.num_gpu_runner_capture_triggers", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CompilationCounter.num_cudagraph_captured", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CompilationCounter.num_inductor_compiles", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CompilationCounter.num_eager_compiles", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CompilationCounter.num_cache_entries_updated", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CompilationCounter.num_compiled_artifacts_saved", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CompilationCounter.num_compiled_artifacts_loaded", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CompilationCounter.stock_torch_compile_count", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 3, "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 13, "n_properties": 0 }, { "kind": "attr", "name": "vllm.compilation.counter.compilation_counter", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.compilation.counter", "names": [ "vllm.compilation.counter.CompilationCounter", "vllm.compilation.counter.compilation_counter" ], "n_typable": 4, "n_typed": 2, "n_any": 1, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_classes": 1, "n_attrs": 14, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/compilation/cuda_graph.py", "symbol_reports": [ { "kind": "class", "name": "vllm.compilation.cuda_graph.CUDAGraphOptions", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "CUDAGraphOptions.debug_log_enable", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CUDAGraphOptions.gc_disable", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CUDAGraphOptions.weak_ref_output", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.cuda_graph.CUDAGraphStat", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "CUDAGraphStat.num_unpadded_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CUDAGraphStat.num_padded_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CUDAGraphStat.num_paddings", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CUDAGraphStat.runtime_mode", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.cuda_graph.CUDAGraphWrapper", "methods": [ { "kind": "function", "name": "CUDAGraphWrapper.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "CUDAGraphWrapper.__getattr__", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CUDAGraphWrapper.unwrap", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CUDAGraphWrapper.__call__", "n_typed": 1, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CUDAGraphWrapper.runnable", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CUDAGraphWrapper.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CUDAGraphWrapper.runtime_mode", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CUDAGraphWrapper.compilation_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CUDAGraphWrapper.first_run_finished", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CUDAGraphWrapper.is_debugging_mode", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CUDAGraphWrapper.graph_pool", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CUDAGraphWrapper.cudagraph_options", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CUDAGraphWrapper.concrete_cudagraph_entries", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 20, "n_typed": 9, "n_any": 3, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 7, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.cuda_graph.CUDAGraphLogging", "methods": [ { "kind": "function", "name": "CUDAGraphLogging.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CUDAGraphLogging.reset", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CUDAGraphLogging.observe", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CUDAGraphLogging.generate_metric_table", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CUDAGraphLogging.log", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CUDAGraphLogging.COLUMN_HEADERS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CUDAGraphLogging.cg_mode", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CUDAGraphLogging.cg_capture_sizes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CUDAGraphLogging.settings_header", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 9, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 4, "n_attrs": 4, "n_properties": 0 }, { "kind": "attr", "name": "vllm.compilation.cuda_graph.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.compilation.cuda_graph.CUDAGraphEntry", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "CUDAGraphEntry.batch_descriptor", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CUDAGraphEntry.cudagraph", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CUDAGraphEntry.output", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CUDAGraphEntry.input_addresses", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.compilation.cuda_graph", "names": [ "vllm.compilation.cuda_graph.CUDAGraphEntry", "vllm.compilation.cuda_graph.CUDAGraphLogging", "vllm.compilation.cuda_graph.CUDAGraphOptions", "vllm.compilation.cuda_graph.CUDAGraphStat", "vllm.compilation.cuda_graph.CUDAGraphWrapper", "vllm.compilation.cuda_graph.logger" ], "n_typable": 33, "n_typed": 18, "n_any": 3, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 11, "n_classes": 5, "n_attrs": 25, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/compilation/decorators.py", "symbol_reports": [ { "kind": "function", "name": "vllm.compilation.decorators.support_torch_compile", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 5, "n_typable": 5, "n_params": 4, "n_function_overloads": 5, "n_function_params": 4 }, { "kind": "function", "name": "vllm.compilation.decorators.maybe_use_cudagraph_partition_wrapper", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.compilation.decorators.ignore_torch_compile", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.compilation.decorators.IGNORE_COMPILE_KEY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.compilation.decorators.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.compilation.decorators", "names": [ "vllm.compilation.decorators.IGNORE_COMPILE_KEY", "vllm.compilation.decorators.ignore_torch_compile", "vllm.compilation.decorators.logger", "vllm.compilation.decorators.maybe_use_cudagraph_partition_wrapper", "vllm.compilation.decorators.support_torch_compile" ], "n_typable": 10, "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_functions": 3, "n_function_overloads": 7, "n_function_params": 6, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/compilation/monitor.py", "symbol_reports": [ { "kind": "function", "name": "vllm.compilation.monitor.end_monitoring_torch_compile", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.compilation.monitor.cudagraph_capturing_enabled", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.compilation.monitor.context_manager", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.compilation.monitor.start_monitoring_torch_compile", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.compilation.monitor.validate_cudagraph_capturing_enabled", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.compilation.monitor.set_cudagraph_capturing_enabled", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.compilation.monitor.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.compilation.monitor.torch_compile_start_time", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.compilation.monitor", "names": [ "vllm.compilation.monitor.context_manager", "vllm.compilation.monitor.cudagraph_capturing_enabled", "vllm.compilation.monitor.end_monitoring_torch_compile", "vllm.compilation.monitor.logger", "vllm.compilation.monitor.set_cudagraph_capturing_enabled", "vllm.compilation.monitor.start_monitoring_torch_compile", "vllm.compilation.monitor.torch_compile_start_time", "vllm.compilation.monitor.validate_cudagraph_capturing_enabled" ], "n_typable": 10, "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 3, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/compilation/partition_rules.py", "symbol_reports": [ { "kind": "function", "name": "vllm.compilation.partition_rules.inductor_partition_rule_context", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.compilation.partition_rules.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.compilation.partition_rules.should_split", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.compilation.partition_rules", "names": [ "vllm.compilation.partition_rules.inductor_partition_rule_context", "vllm.compilation.partition_rules.logger", "vllm.compilation.partition_rules.should_split" ], "n_typable": 6, "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 3, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/compilation/passes/fusion/act_quant_fusion.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.compilation.passes.fusion.act_quant_fusion.silu_and_mul_nvfp4_quant_supported", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.act_quant_fusion.ActivationQuantPattern", "methods": [ { "kind": "function", "name": "ActivationQuantPattern.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ActivationQuantPattern.empty_quant", "n_typed": 1, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ActivationQuantPattern.register", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ActivationQuantPattern.quant_key", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ActivationQuantPattern.quant_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ActivationQuantPattern.QUANT_OP", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ActivationQuantPattern.FUSED_OP", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ActivationQuantPattern.silu_and_mul_matcher", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 5, "n_any": 2, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_attrs": 5, "n_properties": 0 }, { "kind": "attr", "name": "vllm.compilation.passes.fusion.act_quant_fusion.FP8_DTYPE", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.act_quant_fusion.ActivationQuantFusionPass", "methods": [ { "kind": "function", "name": "ActivationQuantFusionPass.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ActivationQuantFusionPass.__call__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ActivationQuantFusionPass.uuid", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ActivationQuantFusionPass.patterns", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 2, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.compilation.passes.fusion.act_quant_fusion.FUSED_OPS", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.compilation.passes.fusion.act_quant_fusion.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.act_quant_fusion.SiluMulNvfp4QuantPattern", "methods": [ { "kind": "function", "name": "SiluMulNvfp4QuantPattern.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SiluMulNvfp4QuantPattern.get_inputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SiluMulNvfp4QuantPattern.register", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.act_quant_fusion.SiluMulFp8StaticQuantPattern", "methods": [ { "kind": "function", "name": "SiluMulFp8StaticQuantPattern.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SiluMulFp8StaticQuantPattern.get_inputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SiluMulFp8StaticQuantPattern.register", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SiluMulFp8StaticQuantPattern.quant_matcher", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 5, "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 1, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.compilation.passes.fusion.act_quant_fusion", "names": [ "vllm.compilation.passes.fusion.act_quant_fusion.ActivationQuantFusionPass", "vllm.compilation.passes.fusion.act_quant_fusion.ActivationQuantPattern", "vllm.compilation.passes.fusion.act_quant_fusion.FP8_DTYPE", "vllm.compilation.passes.fusion.act_quant_fusion.FUSED_OPS", "vllm.compilation.passes.fusion.act_quant_fusion.SiluMulFp8StaticQuantPattern", "vllm.compilation.passes.fusion.act_quant_fusion.SiluMulNvfp4QuantPattern", "vllm.compilation.passes.fusion.act_quant_fusion.logger", "vllm.compilation.passes.fusion.act_quant_fusion.silu_and_mul_nvfp4_quant_supported" ], "n_typable": 31, "n_typed": 20, "n_any": 2, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 8, "n_classes": 4, "n_attrs": 11, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/compilation/passes/fusion/allreduce_rms_fusion.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.compilation.passes.fusion.allreduce_rms_fusion.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.compilation.passes.fusion.allreduce_rms_fusion.FI_ALLREDUCE_FUSION_MAX_SIZE_MB", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.compilation.passes.fusion.allreduce_rms_fusion.call_trtllm_fused_allreduce_norm_fake", "n_typed": 14, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.allreduce_rms_fusion.AllReduceFusedAddRMSNormStaticQuantFP8Pattern", "methods": [ { "kind": "function", "name": "AllReduceFusedAddRMSNormStaticQuantFP8Pattern.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "AllReduceFusedAddRMSNormStaticQuantFP8Pattern.get_inputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AllReduceFusedAddRMSNormStaticQuantFP8Pattern.register", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AllReduceFusedAddRMSNormStaticQuantFP8Pattern.epsilon", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AllReduceFusedAddRMSNormStaticQuantFP8Pattern.allreduce_params", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AllReduceFusedAddRMSNormStaticQuantFP8Pattern.quant_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AllReduceFusedAddRMSNormStaticQuantFP8Pattern.rmsnorm_matcher", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AllReduceFusedAddRMSNormStaticQuantFP8Pattern.quant_matcher", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 8, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 5, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.allreduce_rms_fusion.AllReduceFusionPass", "methods": [ { "kind": "function", "name": "AllReduceFusionPass.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AllReduceFusionPass.register_patterns", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AllReduceFusionPass.is_applicable_for_range", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AllReduceFusionPass.__call__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AllReduceFusionPass.__del__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AllReduceFusionPass.disabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AllReduceFusionPass.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AllReduceFusionPass.patterns", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AllReduceFusionPass.hidden_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AllReduceFusionPass.group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AllReduceFusionPass.max_token_num", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AllReduceFusionPass.allreduce_params", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 9, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 3, "n_attrs": 7, "n_properties": 0 }, { "kind": "attr", "name": "vllm.compilation.passes.fusion.allreduce_rms_fusion.FP8_DTYPE", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.allreduce_rms_fusion.AllReduceFusedAddRMSNormStaticQuantNVFP4Pattern", "methods": [ { "kind": "function", "name": "AllReduceFusedAddRMSNormStaticQuantNVFP4Pattern.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "AllReduceFusedAddRMSNormStaticQuantNVFP4Pattern.get_inputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AllReduceFusedAddRMSNormStaticQuantNVFP4Pattern.register", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AllReduceFusedAddRMSNormStaticQuantNVFP4Pattern.epsilon", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AllReduceFusedAddRMSNormStaticQuantNVFP4Pattern.allreduce_params", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AllReduceFusedAddRMSNormStaticQuantNVFP4Pattern.rmsnorm_matcher", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 8, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 5, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.allreduce_rms_fusion.AllReduceRMSNormPattern", "methods": [ { "kind": "function", "name": "AllReduceRMSNormPattern.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "AllReduceRMSNormPattern.get_inputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AllReduceRMSNormPattern.register", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AllReduceRMSNormPattern.epsilon", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AllReduceRMSNormPattern.allreduce_params", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AllReduceRMSNormPattern.rmsnorm_matcher", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 8, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 5, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.allreduce_rms_fusion.AllReduceFusedRMSNormStaticQuantFP8Pattern", "methods": [ { "kind": "function", "name": "AllReduceFusedRMSNormStaticQuantFP8Pattern.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "AllReduceFusedRMSNormStaticQuantFP8Pattern.get_inputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AllReduceFusedRMSNormStaticQuantFP8Pattern.register", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AllReduceFusedRMSNormStaticQuantFP8Pattern.epsilon", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AllReduceFusedRMSNormStaticQuantFP8Pattern.allreduce_params", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AllReduceFusedRMSNormStaticQuantFP8Pattern.quant_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AllReduceFusedRMSNormStaticQuantFP8Pattern.rmsnorm_matcher", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AllReduceFusedRMSNormStaticQuantFP8Pattern.quant_matcher", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 8, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 5, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.allreduce_rms_fusion.BasePattern", "methods": [ { "kind": "function", "name": "BasePattern.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BasePattern.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BasePattern.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BasePattern.tp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BasePattern.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 3, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 4, "n_properties": 0 }, { "kind": "attr", "name": "vllm.compilation.passes.fusion.allreduce_rms_fusion.flashinfer_comm", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.allreduce_rms_fusion.AllReduceFusedRMSNormStaticQuantNVFP4Pattern", "methods": [ { "kind": "function", "name": "AllReduceFusedRMSNormStaticQuantNVFP4Pattern.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "AllReduceFusedRMSNormStaticQuantNVFP4Pattern.get_inputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AllReduceFusedRMSNormStaticQuantNVFP4Pattern.register", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AllReduceFusedRMSNormStaticQuantNVFP4Pattern.epsilon", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AllReduceFusedRMSNormStaticQuantNVFP4Pattern.allreduce_params", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AllReduceFusedRMSNormStaticQuantNVFP4Pattern.rmsnorm_matcher", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 8, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 5, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.allreduce_rms_fusion.FlashInferFusedAllReduceParams", "methods": [ { "kind": "function", "name": "FlashInferFusedAllReduceParams.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FlashInferFusedAllReduceParams.get_trtllm_fused_allreduce_kwargs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashInferFusedAllReduceParams.world_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferFusedAllReduceParams.launch_with_pdl", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferFusedAllReduceParams.fp32_acc", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferFusedAllReduceParams.max_token_num", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 4, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.allreduce_rms_fusion.AllReduceFusedAddRMSNormPattern", "methods": [ { "kind": "function", "name": "AllReduceFusedAddRMSNormPattern.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "AllReduceFusedAddRMSNormPattern.get_inputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AllReduceFusedAddRMSNormPattern.register", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AllReduceFusedAddRMSNormPattern.epsilon", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AllReduceFusedAddRMSNormPattern.allreduce_params", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AllReduceFusedAddRMSNormPattern.rmsnorm_matcher", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 8, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 5, "n_attrs": 3, "n_properties": 0 }, { "kind": "function", "name": "vllm.compilation.passes.fusion.allreduce_rms_fusion.call_trtllm_fused_allreduce_norm", "n_typed": 14, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 }, { "kind": "attr", "name": "vllm.compilation.passes.fusion.allreduce_rms_fusion.MiB", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.compilation.passes.fusion.allreduce_rms_fusion", "names": [ "vllm.compilation.passes.fusion.allreduce_rms_fusion.AllReduceFusedAddRMSNormPattern", "vllm.compilation.passes.fusion.allreduce_rms_fusion.AllReduceFusedAddRMSNormStaticQuantFP8Pattern", "vllm.compilation.passes.fusion.allreduce_rms_fusion.AllReduceFusedAddRMSNormStaticQuantNVFP4Pattern", "vllm.compilation.passes.fusion.allreduce_rms_fusion.AllReduceFusedRMSNormStaticQuantFP8Pattern", "vllm.compilation.passes.fusion.allreduce_rms_fusion.AllReduceFusedRMSNormStaticQuantNVFP4Pattern", "vllm.compilation.passes.fusion.allreduce_rms_fusion.AllReduceFusionPass", "vllm.compilation.passes.fusion.allreduce_rms_fusion.AllReduceRMSNormPattern", "vllm.compilation.passes.fusion.allreduce_rms_fusion.BasePattern", "vllm.compilation.passes.fusion.allreduce_rms_fusion.FI_ALLREDUCE_FUSION_MAX_SIZE_MB", "vllm.compilation.passes.fusion.allreduce_rms_fusion.FP8_DTYPE", "vllm.compilation.passes.fusion.allreduce_rms_fusion.FlashInferFusedAllReduceParams", "vllm.compilation.passes.fusion.allreduce_rms_fusion.MiB", "vllm.compilation.passes.fusion.allreduce_rms_fusion.call_trtllm_fused_allreduce_norm", "vllm.compilation.passes.fusion.allreduce_rms_fusion.call_trtllm_fused_allreduce_norm_fake", "vllm.compilation.passes.fusion.allreduce_rms_fusion.flashinfer_comm", "vllm.compilation.passes.fusion.allreduce_rms_fusion.logger" ], "n_typable": 132, "n_typed": 94, "n_any": 0, "n_untyped": 38, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 26, "n_methods": 26, "n_method_overloads": 26, "n_method_params": 37, "n_classes": 9, "n_attrs": 42, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/compilation/passes/fusion/attn_quant_fusion.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.compilation.passes.fusion.attn_quant_fusion.P", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.attn_quant_fusion.AttentionFp8StaticQuantPattern", "methods": [ { "kind": "function", "name": "AttentionFp8StaticQuantPattern.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "AttentionFp8StaticQuantPattern._register", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AttentionFp8StaticQuantPattern.quant_matcher", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.attn_quant_fusion.AttentionQuantPattern", "methods": [ { "kind": "function", "name": "AttentionQuantPattern.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "AttentionQuantPattern.empty", "n_typed": 1, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AttentionQuantPattern.empty_quant", "n_typed": 1, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AttentionQuantPattern.wrap_trace_fn", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AttentionQuantPattern.fx_view_to_reshape", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AttentionQuantPattern.remove_noop_permutes", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AttentionQuantPattern.register_if_supported", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AttentionQuantPattern._register", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AttentionQuantPattern.layer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AttentionQuantPattern.layer_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AttentionQuantPattern.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AttentionQuantPattern.head_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AttentionQuantPattern.quant_key", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AttentionQuantPattern.quant_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AttentionQuantPattern.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AttentionQuantPattern.QUANT_OP", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 29, "n_typed": 17, "n_any": 4, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 13, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.attn_quant_fusion.AttnFusionPass", "methods": [ { "kind": "function", "name": "AttnFusionPass.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AttnFusionPass.__call__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AttnFusionPass.uuid", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AttnFusionPass.patterns", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 6, "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 2, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.compilation.passes.fusion.attn_quant_fusion.FP8_DTYPE", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.attn_quant_fusion.AttentionNvfp4QuantPattern", "methods": [ { "kind": "function", "name": "AttentionNvfp4QuantPattern.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AttentionNvfp4QuantPattern._register", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.compilation.passes.fusion.attn_quant_fusion.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.compilation.passes.fusion.attn_quant_fusion", "names": [ "vllm.compilation.passes.fusion.attn_quant_fusion.AttentionFp8StaticQuantPattern", "vllm.compilation.passes.fusion.attn_quant_fusion.AttentionNvfp4QuantPattern", "vllm.compilation.passes.fusion.attn_quant_fusion.AttentionQuantPattern", "vllm.compilation.passes.fusion.attn_quant_fusion.AttnFusionPass", "vllm.compilation.passes.fusion.attn_quant_fusion.FP8_DTYPE", "vllm.compilation.passes.fusion.attn_quant_fusion.P", "vllm.compilation.passes.fusion.attn_quant_fusion.logger" ], "n_typable": 49, "n_typed": 33, "n_any": 4, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 22, "n_classes": 4, "n_attrs": 13, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/compilation/passes/fusion/collective_fusion.py", "symbol_reports": [ { "kind": "class", "name": "vllm.compilation.passes.fusion.collective_fusion.AllGatherCutlassScaledMMPattern", "methods": [ { "kind": "function", "name": "AllGatherCutlassScaledMMPattern.get_inputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AllGatherCutlassScaledMMPattern.register", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.collective_fusion.ScaledMMReduceScatterPattern", "methods": [ { "kind": "function", "name": "ScaledMMReduceScatterPattern.get_inputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ScaledMMReduceScatterPattern.register", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.collective_fusion.AsyncTPPass", "methods": [ { "kind": "function", "name": "AsyncTPPass.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AsyncTPPass.is_applicable_for_range", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AsyncTPPass.__call__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AsyncTPPass.patterns", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.compilation.passes.fusion.collective_fusion.FP8_DTYPE", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.collective_fusion.GEMMReduceScatterPattern", "methods": [ { "kind": "function", "name": "GEMMReduceScatterPattern.get_inputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GEMMReduceScatterPattern.register", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.collective_fusion.BasePattern", "methods": [ { "kind": "function", "name": "BasePattern.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BasePattern.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BasePattern.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BasePattern.tp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BasePattern.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 3, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.collective_fusion.AllGatherGEMMPattern", "methods": [ { "kind": "function", "name": "AllGatherGEMMPattern.get_inputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AllGatherGEMMPattern.register", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.collective_fusion.AllGatherScaledMMPattern", "methods": [ { "kind": "function", "name": "AllGatherScaledMMPattern.get_inputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AllGatherScaledMMPattern.register", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.collective_fusion.CutlassScaledMMReduceScatterPattern", "methods": [ { "kind": "function", "name": "CutlassScaledMMReduceScatterPattern.get_inputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CutlassScaledMMReduceScatterPattern.register", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.compilation.passes.fusion.collective_fusion.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.compilation.passes.fusion.collective_fusion", "names": [ "vllm.compilation.passes.fusion.collective_fusion.AllGatherCutlassScaledMMPattern", "vllm.compilation.passes.fusion.collective_fusion.AllGatherGEMMPattern", "vllm.compilation.passes.fusion.collective_fusion.AllGatherScaledMMPattern", "vllm.compilation.passes.fusion.collective_fusion.AsyncTPPass", "vllm.compilation.passes.fusion.collective_fusion.BasePattern", "vllm.compilation.passes.fusion.collective_fusion.CutlassScaledMMReduceScatterPattern", "vllm.compilation.passes.fusion.collective_fusion.FP8_DTYPE", "vllm.compilation.passes.fusion.collective_fusion.GEMMReduceScatterPattern", "vllm.compilation.passes.fusion.collective_fusion.ScaledMMReduceScatterPattern", "vllm.compilation.passes.fusion.collective_fusion.logger" ], "n_typable": 34, "n_typed": 28, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 16, "n_method_overloads": 16, "n_method_params": 11, "n_classes": 8, "n_attrs": 7, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/compilation/passes/fusion/matcher_utils.py", "symbol_reports": [ { "kind": "class", "name": "vllm.compilation.passes.fusion.matcher_utils.MatcherFusedAddRMSNorm", "methods": [ { "kind": "function", "name": "MatcherFusedAddRMSNorm.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MatcherFusedAddRMSNorm.inputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MatcherFusedAddRMSNorm.forward_rocm_aiter", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MatcherFusedAddRMSNorm.forward_custom", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MatcherFusedAddRMSNorm.forward_native", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MatcherFusedAddRMSNorm.epsilon", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MatcherFusedAddRMSNorm.match_rocm_aiter", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 17, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 12, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.matcher_utils.MatcherRotaryEmbedding", "methods": [ { "kind": "function", "name": "MatcherRotaryEmbedding.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "MatcherRotaryEmbedding.inputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MatcherRotaryEmbedding.forward_custom", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MatcherRotaryEmbedding.forward_native", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MatcherRotaryEmbedding.is_neox", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MatcherRotaryEmbedding.head_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MatcherRotaryEmbedding.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MatcherRotaryEmbedding.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MatcherRotaryEmbedding.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MatcherRotaryEmbedding.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MatcherRotaryEmbedding.rotary_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MatcherRotaryEmbedding.rotary_op", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 27, "n_typed": 19, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 15, "n_attrs": 8, "n_properties": 0 }, { "kind": "attr", "name": "vllm.compilation.passes.fusion.matcher_utils.QUANT_OPS", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.matcher_utils.MatcherSiluAndMul", "methods": [ { "kind": "function", "name": "MatcherSiluAndMul.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MatcherSiluAndMul.inputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MatcherSiluAndMul.forward_custom", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MatcherSiluAndMul.forward_native", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.matcher_utils.MatcherQuantFP8", "methods": [ { "kind": "function", "name": "MatcherQuantFP8.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "MatcherQuantFP8.forward_rocm_aiter", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MatcherQuantFP8.forward_custom", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MatcherQuantFP8.forward_native", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MatcherQuantFP8.make_scale", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MatcherQuantFP8.inputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MatcherQuantFP8.quant_key", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MatcherQuantFP8.has_col_major_scales", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MatcherQuantFP8.is_e8m0", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MatcherQuantFP8.match_rocm_aiter", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MatcherQuantFP8.is_tma_aligned", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MatcherQuantFP8.quant_fp8", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MatcherQuantFP8.QUANT_OP", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 27, "n_typed": 20, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 14, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.matcher_utils.MatcherRMSNorm", "methods": [ { "kind": "function", "name": "MatcherRMSNorm.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MatcherRMSNorm.inputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MatcherRMSNorm.forward_rocm_aiter", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MatcherRMSNorm.forward_custom", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MatcherRMSNorm.forward_native", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MatcherRMSNorm.epsilon", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MatcherRMSNorm.match_rocm_aiter", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 14, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.matcher_utils.MatcherCustomOp", "methods": [ { "kind": "function", "name": "MatcherCustomOp.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MatcherCustomOp.forward_custom", "n_typed": 0, "n_any": 3, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MatcherCustomOp.forward_native", "n_typed": 0, "n_any": 3, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MatcherCustomOp.__call__", "n_typed": 0, "n_any": 3, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MatcherCustomOp.empty", "n_typed": 1, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MatcherCustomOp.empty_int64", "n_typed": 1, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MatcherCustomOp.empty_f32", "n_typed": 1, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MatcherCustomOp.inputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MatcherCustomOp.model_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MatcherCustomOp.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MatcherCustomOp.enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MatcherCustomOp.forward", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 25, "n_typed": 6, "n_any": 15, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 13, "n_attrs": 4, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.compilation.passes.fusion.matcher_utils", "names": [ "vllm.compilation.passes.fusion.matcher_utils.MatcherCustomOp", "vllm.compilation.passes.fusion.matcher_utils.MatcherFusedAddRMSNorm", "vllm.compilation.passes.fusion.matcher_utils.MatcherQuantFP8", "vllm.compilation.passes.fusion.matcher_utils.MatcherRMSNorm", "vllm.compilation.passes.fusion.matcher_utils.MatcherRotaryEmbedding", "vllm.compilation.passes.fusion.matcher_utils.MatcherSiluAndMul", "vllm.compilation.passes.fusion.matcher_utils.QUANT_OPS" ], "n_typable": 122, "n_typed": 84, "n_any": 15, "n_untyped": 23, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 32, "n_method_overloads": 32, "n_method_params": 66, "n_classes": 6, "n_attrs": 24, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/compilation/passes/fusion/qk_norm_rope_fusion.py", "symbol_reports": [ { "kind": "class", "name": "vllm.compilation.passes.fusion.qk_norm_rope_fusion.QKNormRoPEFusionPass", "methods": [ { "kind": "function", "name": "QKNormRoPEFusionPass.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "QKNormRoPEFusionPass.__call__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "QKNormRoPEFusionPass.uuid", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "QKNormRoPEFusionPass.patterns", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 2, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.qk_norm_rope_fusion.QkNormRopePattern", "methods": [ { "kind": "function", "name": "QkNormRopePattern.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "QkNormRopePattern.get_inputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "QkNormRopePattern.wrap_trace_fn", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "QkNormRopePattern.fx_view_to_reshape", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "QkNormRopePattern.register", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "QkNormRopePattern.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QkNormRopePattern.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QkNormRopePattern.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QkNormRopePattern.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QkNormRopePattern.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QkNormRopePattern.eps", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QkNormRopePattern.rmsnorm_matcher", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QkNormRopePattern.is_neox", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QkNormRopePattern.rope_flashinfer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QkNormRopePattern.rope_matcher", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 25, "n_typed": 15, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 10, "n_attrs": 10, "n_properties": 0 }, { "kind": "attr", "name": "vllm.compilation.passes.fusion.qk_norm_rope_fusion.P", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.compilation.passes.fusion.qk_norm_rope_fusion.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.compilation.passes.fusion.qk_norm_rope_fusion", "names": [ "vllm.compilation.passes.fusion.qk_norm_rope_fusion.P", "vllm.compilation.passes.fusion.qk_norm_rope_fusion.QKNormRoPEFusionPass", "vllm.compilation.passes.fusion.qk_norm_rope_fusion.QkNormRopePattern", "vllm.compilation.passes.fusion.qk_norm_rope_fusion.logger" ], "n_typable": 32, "n_typed": 21, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 12, "n_classes": 2, "n_attrs": 13, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/compilation/passes/fusion/rms_quant_fusion.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.compilation.passes.fusion.rms_quant_fusion.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.compilation.passes.fusion.rms_quant_fusion.empty_fp32", "n_typed": 1, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.rms_quant_fusion.RMSNormGroupQuantPattern", "methods": [ { "kind": "function", "name": "RMSNormGroupQuantPattern.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "RMSNormGroupQuantPattern.register", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RMSNormGroupQuantPattern.group_shape", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RMSNormGroupQuantPattern.has_col_major_scales", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RMSNormGroupQuantPattern.is_tma_aligned", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 10, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.rms_quant_fusion.FusedAddRMSNormStaticQuantPattern", "methods": [ { "kind": "function", "name": "FusedAddRMSNormStaticQuantPattern.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "FusedAddRMSNormStaticQuantPattern.register", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.compilation.passes.fusion.rms_quant_fusion.QUANT_OPS", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.compilation.passes.fusion.rms_quant_fusion.FP8_DTYPE", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.compilation.passes.fusion.rms_quant_fusion.empty_i32", "n_typed": 1, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.rms_quant_fusion.RMSNormStaticQuantPattern", "methods": [ { "kind": "function", "name": "RMSNormStaticQuantPattern.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "RMSNormStaticQuantPattern.register", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.rms_quant_fusion.RMSNormQuantPattern", "methods": [ { "kind": "function", "name": "RMSNormQuantPattern.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RMSNormQuantPattern.epsilon", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RMSNormQuantPattern.quant_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RMSNormQuantPattern.model_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RMSNormQuantPattern.FUSED_OP", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RMSNormQuantPattern.rmsnorm_matcher", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RMSNormQuantPattern.quant_matcher", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 6, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 5, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.rms_quant_fusion.RMSNormQuantFusionPass", "methods": [ { "kind": "function", "name": "RMSNormQuantFusionPass.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RMSNormQuantFusionPass.__call__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RMSNormQuantFusionPass.uuid", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RMSNormQuantFusionPass.patterns", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 2, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.compilation.passes.fusion.rms_quant_fusion.FUSED_OPS", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.compilation.passes.fusion.rms_quant_fusion.empty_bf16", "n_typed": 1, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.compilation.passes.fusion.rms_quant_fusion.empty_i64", "n_typed": 1, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.rms_quant_fusion.FusedAddRMSNormDynamicQuantPattern", "methods": [ { "kind": "function", "name": "FusedAddRMSNormDynamicQuantPattern.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FusedAddRMSNormDynamicQuantPattern.register", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.rms_quant_fusion.FusedRMSQuantKey", "methods": [ { "kind": "function", "name": "FusedRMSQuantKey.__str__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FusedRMSQuantKey.quant", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedRMSQuantKey.fused_add", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.rms_quant_fusion.FusedAddRMSNormGroupQuantPattern", "methods": [ { "kind": "function", "name": "FusedAddRMSNormGroupQuantPattern.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "FusedAddRMSNormGroupQuantPattern.register", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FusedAddRMSNormGroupQuantPattern.group_shape", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedAddRMSNormGroupQuantPattern.is_e8m0", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedAddRMSNormGroupQuantPattern.has_col_major_scales", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedAddRMSNormGroupQuantPattern.is_tma_aligned", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 10, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.rms_quant_fusion.RMSNormDynamicQuantPattern", "methods": [ { "kind": "function", "name": "RMSNormDynamicQuantPattern.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "RMSNormDynamicQuantPattern.register", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.compilation.passes.fusion.rms_quant_fusion", "names": [ "vllm.compilation.passes.fusion.rms_quant_fusion.FP8_DTYPE", "vllm.compilation.passes.fusion.rms_quant_fusion.FUSED_OPS", "vllm.compilation.passes.fusion.rms_quant_fusion.FusedAddRMSNormDynamicQuantPattern", "vllm.compilation.passes.fusion.rms_quant_fusion.FusedAddRMSNormGroupQuantPattern", "vllm.compilation.passes.fusion.rms_quant_fusion.FusedAddRMSNormStaticQuantPattern", "vllm.compilation.passes.fusion.rms_quant_fusion.FusedRMSQuantKey", "vllm.compilation.passes.fusion.rms_quant_fusion.QUANT_OPS", "vllm.compilation.passes.fusion.rms_quant_fusion.RMSNormDynamicQuantPattern", "vllm.compilation.passes.fusion.rms_quant_fusion.RMSNormGroupQuantPattern", "vllm.compilation.passes.fusion.rms_quant_fusion.RMSNormQuantFusionPass", "vllm.compilation.passes.fusion.rms_quant_fusion.RMSNormQuantPattern", "vllm.compilation.passes.fusion.rms_quant_fusion.RMSNormStaticQuantPattern", "vllm.compilation.passes.fusion.rms_quant_fusion.empty_bf16", "vllm.compilation.passes.fusion.rms_quant_fusion.empty_fp32", "vllm.compilation.passes.fusion.rms_quant_fusion.empty_i32", "vllm.compilation.passes.fusion.rms_quant_fusion.empty_i64", "vllm.compilation.passes.fusion.rms_quant_fusion.logger" ], "n_typable": 88, "n_typed": 65, "n_any": 8, "n_untyped": 15, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 8, "n_methods": 17, "n_method_overloads": 17, "n_method_params": 41, "n_classes": 9, "n_attrs": 20, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/compilation/passes/fusion/rocm_aiter_fusion.py", "symbol_reports": [ { "kind": "class", "name": "vllm.compilation.passes.fusion.rocm_aiter_fusion.AiterRMSNormDynamicQuantPattern", "methods": [ { "kind": "function", "name": "AiterRMSNormDynamicQuantPattern.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "AiterRMSNormDynamicQuantPattern.register", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AiterRMSNormDynamicQuantPattern.FUSED_OP", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.rocm_aiter_fusion.AiterRMSFp8GroupQuantPattern", "methods": [ { "kind": "function", "name": "AiterRMSFp8GroupQuantPattern.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "AiterRMSFp8GroupQuantPattern.register", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AiterRMSFp8GroupQuantPattern.FUSED_OP", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.rocm_aiter_fusion.RocmAiterRMSNormQuantFusionPass", "methods": [ { "kind": "function", "name": "RocmAiterRMSNormQuantFusionPass.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RocmAiterRMSNormQuantFusionPass.__call__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RocmAiterRMSNormQuantFusionPass.uuid", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RocmAiterRMSNormQuantFusionPass.patterns", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 2, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.rocm_aiter_fusion.AddAiterRMSNormPadPattern", "methods": [ { "kind": "function", "name": "AddAiterRMSNormPadPattern.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "AddAiterRMSNormPadPattern.get_inputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AddAiterRMSNormPadPattern.register", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AddAiterRMSNormPadPattern.AITER_TRITON_ADD_RMSNORM_PAD_OP", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AddAiterRMSNormPadPattern.epsilon", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AddAiterRMSNormPadPattern.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AddAiterRMSNormPadPattern.x_pad_to_multiple", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AddAiterRMSNormPadPattern.rmsnorm_matcher", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 6, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.rocm_aiter_fusion.AiterSiluMulFp8GroupQuantPattern", "methods": [ { "kind": "function", "name": "AiterSiluMulFp8GroupQuantPattern.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AiterSiluMulFp8GroupQuantPattern.get_inputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AiterSiluMulFp8GroupQuantPattern.register", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AiterSiluMulFp8GroupQuantPattern.FUSED_SILU_MUL_QUANT_OP", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AiterSiluMulFp8GroupQuantPattern.silu_and_mul_matcher", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AiterSiluMulFp8GroupQuantPattern.quant_matcher", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 4, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 1, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.compilation.passes.fusion.rocm_aiter_fusion.FP8_DTYPE", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.rocm_aiter_fusion.AiterFusedAddRMSFp8GroupQuantPattern", "methods": [ { "kind": "function", "name": "AiterFusedAddRMSFp8GroupQuantPattern.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "AiterFusedAddRMSFp8GroupQuantPattern.register", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AiterFusedAddRMSFp8GroupQuantPattern.FUSED_OP", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.rocm_aiter_fusion.AiterFusedAddRMSNormDynamicQuantPattern", "methods": [ { "kind": "function", "name": "AiterFusedAddRMSNormDynamicQuantPattern.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "AiterFusedAddRMSNormDynamicQuantPattern.register", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AiterFusedAddRMSNormDynamicQuantPattern.FUSED_OP", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.rocm_aiter_fusion.RocmAiterSiluMulFp8GroupQuantFusionPass", "methods": [ { "kind": "function", "name": "RocmAiterSiluMulFp8GroupQuantFusionPass.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RocmAiterSiluMulFp8GroupQuantFusionPass.__call__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RocmAiterSiluMulFp8GroupQuantFusionPass.uuid", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RocmAiterSiluMulFp8GroupQuantFusionPass.patterns", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 2, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.rocm_aiter_fusion.AiterRMSNormQuantPattern", "methods": [ { "kind": "function", "name": "AiterRMSNormQuantPattern.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AiterRMSNormQuantPattern.epsilon", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AiterRMSNormQuantPattern.quant_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AiterRMSNormQuantPattern.rmsnorm_matcher", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AiterRMSNormQuantPattern.quant_matcher", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 3, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 3, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.rocm_aiter_fusion.RocmAiterTritonAddRMSNormPadFusionPass", "methods": [ { "kind": "function", "name": "RocmAiterTritonAddRMSNormPadFusionPass.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RocmAiterTritonAddRMSNormPadFusionPass.__call__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RocmAiterTritonAddRMSNormPadFusionPass.uuid", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RocmAiterTritonAddRMSNormPadFusionPass.patterns", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 6, "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 2, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.compilation.passes.fusion.rocm_aiter_fusion.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.compilation.passes.fusion.rocm_aiter_fusion", "names": [ "vllm.compilation.passes.fusion.rocm_aiter_fusion.AddAiterRMSNormPadPattern", "vllm.compilation.passes.fusion.rocm_aiter_fusion.AiterFusedAddRMSFp8GroupQuantPattern", "vllm.compilation.passes.fusion.rocm_aiter_fusion.AiterFusedAddRMSNormDynamicQuantPattern", "vllm.compilation.passes.fusion.rocm_aiter_fusion.AiterRMSFp8GroupQuantPattern", "vllm.compilation.passes.fusion.rocm_aiter_fusion.AiterRMSNormDynamicQuantPattern", "vllm.compilation.passes.fusion.rocm_aiter_fusion.AiterRMSNormQuantPattern", "vllm.compilation.passes.fusion.rocm_aiter_fusion.AiterSiluMulFp8GroupQuantPattern", "vllm.compilation.passes.fusion.rocm_aiter_fusion.FP8_DTYPE", "vllm.compilation.passes.fusion.rocm_aiter_fusion.RocmAiterRMSNormQuantFusionPass", "vllm.compilation.passes.fusion.rocm_aiter_fusion.RocmAiterSiluMulFp8GroupQuantFusionPass", "vllm.compilation.passes.fusion.rocm_aiter_fusion.RocmAiterTritonAddRMSNormPadFusionPass", "vllm.compilation.passes.fusion.rocm_aiter_fusion.logger" ], "n_typable": 83, "n_typed": 62, "n_any": 0, "n_untyped": 21, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 24, "n_method_overloads": 24, "n_method_params": 38, "n_classes": 10, "n_attrs": 21, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/compilation/passes/fusion/rope_kvcache_fusion.py", "symbol_reports": [ { "kind": "function", "name": "vllm.compilation.passes.fusion.rope_kvcache_fusion.fused_rope_and_unified_kv_cache_update_impl", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "vllm.compilation.passes.fusion.rope_kvcache_fusion.fused_rope_and_unified_kv_cache_update_fake", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.rope_kvcache_fusion.RopeReshapeKVCachePattern", "methods": [ { "kind": "function", "name": "RopeReshapeKVCachePattern.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "RopeReshapeKVCachePattern.get_inputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RopeReshapeKVCachePattern.register", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RopeReshapeKVCachePattern.FUSED_OP", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RopeReshapeKVCachePattern.layer_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RopeReshapeKVCachePattern.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RopeReshapeKVCachePattern.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RopeReshapeKVCachePattern.head_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RopeReshapeKVCachePattern.head_size_v", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RopeReshapeKVCachePattern.is_neox", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RopeReshapeKVCachePattern.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RopeReshapeKVCachePattern.k_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RopeReshapeKVCachePattern.v_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RopeReshapeKVCachePattern.rope_matcher", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 6, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_attrs": 11, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.rope_kvcache_fusion.RopeKVCacheFusionPass", "methods": [ { "kind": "function", "name": "RopeKVCacheFusionPass.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RopeKVCacheFusionPass.__call__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RopeKVCacheFusionPass.is_applicable_for_range", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RopeKVCacheFusionPass.uuid", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RopeKVCacheFusionPass.patterns", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "RopeKVCacheFusionPass.max_token_num", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 3, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.compilation.passes.fusion.rope_kvcache_fusion.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.compilation.passes.fusion.rope_kvcache_fusion", "names": [ "vllm.compilation.passes.fusion.rope_kvcache_fusion.RopeKVCacheFusionPass", "vllm.compilation.passes.fusion.rope_kvcache_fusion.RopeReshapeKVCachePattern", "vllm.compilation.passes.fusion.rope_kvcache_fusion.fused_rope_and_unified_kv_cache_update_fake", "vllm.compilation.passes.fusion.rope_kvcache_fusion.fused_rope_and_unified_kv_cache_update_impl", "vllm.compilation.passes.fusion.rope_kvcache_fusion.logger" ], "n_typable": 42, "n_typed": 30, "n_any": 0, "n_untyped": 12, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 14, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 6, "n_classes": 2, "n_attrs": 14, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/compilation/passes/fusion/sequence_parallelism.py", "symbol_reports": [ { "kind": "function", "name": "vllm.compilation.passes.fusion.sequence_parallelism.get_sequence_parallelism_threshold", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.sequence_parallelism.MiddleAllReduceRMSNormPattern", "methods": [ { "kind": "function", "name": "MiddleAllReduceRMSNormPattern.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MiddleAllReduceRMSNormPattern.get_inputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MiddleAllReduceRMSNormPattern.register", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiddleAllReduceRMSNormPattern.rmsnorm_matcher", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.sequence_parallelism.FirstAllReduceRMSNormPattern", "methods": [ { "kind": "function", "name": "FirstAllReduceRMSNormPattern.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "FirstAllReduceRMSNormPattern.get_inputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FirstAllReduceRMSNormPattern.register", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FirstAllReduceRMSNormPattern.rmsnorm_matcher", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.sequence_parallelism.SequenceParallelismPass", "methods": [ { "kind": "function", "name": "SequenceParallelismPass.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SequenceParallelismPass.is_applicable_for_range", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SequenceParallelismPass.__call__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SequenceParallelismPass.min_token_num", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SequenceParallelismPass.noop_cleanup", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SequenceParallelismPass.patterns", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 9, "n_typed": 7, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_attrs": 3, "n_properties": 0 }, { "kind": "function", "name": "vllm.compilation.passes.fusion.sequence_parallelism.get_first_out_wrapper", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.sequence_parallelism.MiddleAllReduceRMSNormStaticFP8Pattern", "methods": [ { "kind": "function", "name": "MiddleAllReduceRMSNormStaticFP8Pattern.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MiddleAllReduceRMSNormStaticFP8Pattern.get_inputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MiddleAllReduceRMSNormStaticFP8Pattern.register", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiddleAllReduceRMSNormStaticFP8Pattern.rmsnorm_matcher", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiddleAllReduceRMSNormStaticFP8Pattern.quant_matcher", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 7, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.compilation.passes.fusion.sequence_parallelism.SP_MIN_HIDDEN_SIZE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.compilation.passes.fusion.sequence_parallelism.FirstAllReduceRMSNormStaticFP8Pattern", "methods": [ { "kind": "function", "name": "FirstAllReduceRMSNormStaticFP8Pattern.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "FirstAllReduceRMSNormStaticFP8Pattern.get_inputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FirstAllReduceRMSNormStaticFP8Pattern.register", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FirstAllReduceRMSNormStaticFP8Pattern.rmsnorm_matcher", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FirstAllReduceRMSNormStaticFP8Pattern.quant_matcher", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 7, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.compilation.passes.fusion.sequence_parallelism.SP_MIN_PER_GPU_SIZE_MB", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.compilation.passes.fusion.sequence_parallelism.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.compilation.passes.fusion.sequence_parallelism", "names": [ "vllm.compilation.passes.fusion.sequence_parallelism.FirstAllReduceRMSNormPattern", "vllm.compilation.passes.fusion.sequence_parallelism.FirstAllReduceRMSNormStaticFP8Pattern", "vllm.compilation.passes.fusion.sequence_parallelism.MiddleAllReduceRMSNormPattern", "vllm.compilation.passes.fusion.sequence_parallelism.MiddleAllReduceRMSNormStaticFP8Pattern", "vllm.compilation.passes.fusion.sequence_parallelism.SP_MIN_HIDDEN_SIZE", "vllm.compilation.passes.fusion.sequence_parallelism.SP_MIN_PER_GPU_SIZE_MB", "vllm.compilation.passes.fusion.sequence_parallelism.SequenceParallelismPass", "vllm.compilation.passes.fusion.sequence_parallelism.get_first_out_wrapper", "vllm.compilation.passes.fusion.sequence_parallelism.get_sequence_parallelism_threshold", "vllm.compilation.passes.fusion.sequence_parallelism.logger" ], "n_typable": 52, "n_typed": 43, "n_any": 0, "n_untyped": 9, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 4, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 19, "n_classes": 5, "n_attrs": 12, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/compilation/passes/fx_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.compilation.passes.fx_utils.find_op_nodes", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.compilation.passes.fx_utils.get_only_user", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.compilation.passes.fx_utils.is_auto_func", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.compilation.passes.fx_utils.find_getitem_maybe", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.compilation.passes.fx_utils.find_getitem", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.compilation.passes.fx_utils.find_auto_fn_maybe", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.compilation.passes.fx_utils.find_auto_fn", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.compilation.passes.fx_utils.is_func", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.compilation.passes.fx_utils", "names": [ "vllm.compilation.passes.fx_utils.find_auto_fn", "vllm.compilation.passes.fx_utils.find_auto_fn_maybe", "vllm.compilation.passes.fx_utils.find_getitem", "vllm.compilation.passes.fx_utils.find_getitem_maybe", "vllm.compilation.passes.fx_utils.find_op_nodes", "vllm.compilation.passes.fx_utils.get_only_user", "vllm.compilation.passes.fx_utils.is_auto_func", "vllm.compilation.passes.fx_utils.is_func" ], "n_typable": 23, "n_typed": 23, "n_any": 0, "n_untyped": 0, "n_functions": 8, "n_function_overloads": 8, "n_function_params": 15, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/compilation/passes/inductor_pass.py", "symbol_reports": [ { "kind": "function", "name": "vllm.compilation.passes.inductor_pass.enable_fake_mode", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.compilation.passes.inductor_pass.CallableInductorPass", "methods": [ { "kind": "function", "name": "CallableInductorPass.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CallableInductorPass.__call__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CallableInductorPass.uuid", "n_typed": 0, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CallableInductorPass.callable", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 5, "n_any": 1, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.compilation.passes.inductor_pass.P", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.compilation.passes.inductor_pass.get_pass_context", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.compilation.passes.inductor_pass.pass_context", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.compilation.passes.inductor_pass.R", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.compilation.passes.inductor_pass.PassContext", "methods": [ { "kind": "function", "name": "PassContext.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PassContext.compile_range", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.passes.inductor_pass.InductorPass", "methods": [ { "kind": "function", "name": "InductorPass.uuid", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "InductorPass.hash_source", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InductorPass.hash_dict", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InductorPass.is_applicable_for_range", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [ { "kind": "type", "rules": [ "misc" ] } ], "name": "vllm.compilation.passes.inductor_pass", "names": [ "vllm.compilation.passes.inductor_pass.CallableInductorPass", "vllm.compilation.passes.inductor_pass.InductorPass", "vllm.compilation.passes.inductor_pass.P", "vllm.compilation.passes.inductor_pass.PassContext", "vllm.compilation.passes.inductor_pass.R", "vllm.compilation.passes.inductor_pass.enable_fake_mode", "vllm.compilation.passes.inductor_pass.get_pass_context", "vllm.compilation.passes.inductor_pass.pass_context" ], "n_typable": 22, "n_typed": 19, "n_any": 1, "n_untyped": 2, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 2, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 7, "n_classes": 3, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 1 }, { "path": "vllm/compilation/passes/pass_manager.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.compilation.passes.pass_manager.P", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.compilation.passes.pass_manager.with_pattern_match_debug", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.compilation.passes.pass_manager.R", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.compilation.passes.pass_manager.fx", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.compilation.passes.pass_manager.PostGradPassManager", "methods": [ { "kind": "function", "name": "PostGradPassManager.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PostGradPassManager.__call__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PostGradPassManager.configure", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PostGradPassManager.add", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PostGradPassManager.uuid", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PostGradPassManager.passes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 9, "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 3, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.compilation.passes.pass_manager.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [ { "kind": "type", "rules": [ "misc" ] } ], "name": "vllm.compilation.passes.pass_manager", "names": [ "vllm.compilation.passes.pass_manager.P", "vllm.compilation.passes.pass_manager.PostGradPassManager", "vllm.compilation.passes.pass_manager.R", "vllm.compilation.passes.pass_manager.fx", "vllm.compilation.passes.pass_manager.logger", "vllm.compilation.passes.pass_manager.with_pattern_match_debug" ], "n_typable": 12, "n_typed": 11, "n_any": 0, "n_untyped": 1, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 3, "n_classes": 1, "n_attrs": 5, "n_properties": 0, "n_type_ignores": 1 }, { "path": "vllm/compilation/passes/utility/fix_functionalization.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.compilation.passes.utility.fix_functionalization.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.compilation.passes.utility.fix_functionalization.FixFunctionalizationPass", "methods": [ { "kind": "function", "name": "FixFunctionalizationPass.__call__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FixFunctionalizationPass._remove", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FixFunctionalizationPass.defunctionalize", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FixFunctionalizationPass.replace_users_with_mutated_args", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FixFunctionalizationPass.getitem_users", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FixFunctionalizationPass.insert_defunctionalized", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 18, "n_typed": 18, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 12, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.compilation.passes.utility.fix_functionalization", "names": [ "vllm.compilation.passes.utility.fix_functionalization.FixFunctionalizationPass", "vllm.compilation.passes.utility.fix_functionalization.logger" ], "n_typable": 19, "n_typed": 18, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 12, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/compilation/passes/utility/noop_elimination.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.compilation.passes.utility.noop_elimination.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.compilation.passes.utility.noop_elimination.NoOpEliminationPass", "methods": [ { "kind": "function", "name": "NoOpEliminationPass.__call__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NoOpEliminationPass.dims_equivalent", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NoOpEliminationPass.all_dims_equivalent", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 8, "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.compilation.passes.utility.noop_elimination", "names": [ "vllm.compilation.passes.utility.noop_elimination.NoOpEliminationPass", "vllm.compilation.passes.utility.noop_elimination.logger" ], "n_typable": 9, "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 5, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/compilation/passes/utility/post_cleanup.py", "symbol_reports": [ { "kind": "class", "name": "vllm.compilation.passes.utility.post_cleanup.PostCleanupPass", "methods": [ { "kind": "function", "name": "PostCleanupPass.__call__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.compilation.passes.utility.post_cleanup", "names": [ "vllm.compilation.passes.utility.post_cleanup.PostCleanupPass" ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/compilation/passes/utility/scatter_split_replace.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.compilation.passes.utility.scatter_split_replace.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.compilation.passes.utility.scatter_split_replace.ScatterSplitReplacementPass", "methods": [ { "kind": "function", "name": "ScatterSplitReplacementPass.__call__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.compilation.passes.utility.scatter_split_replace", "names": [ "vllm.compilation.passes.utility.scatter_split_replace.ScatterSplitReplacementPass", "vllm.compilation.passes.utility.scatter_split_replace.logger" ], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/compilation/passes/utility/split_coalescing.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.compilation.passes.utility.split_coalescing.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.compilation.passes.utility.split_coalescing.SplitCoalescingPass", "methods": [ { "kind": "function", "name": "SplitCoalescingPass.__call__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.compilation.passes.utility.split_coalescing", "names": [ "vllm.compilation.passes.utility.split_coalescing.SplitCoalescingPass", "vllm.compilation.passes.utility.split_coalescing.logger" ], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/compilation/passes/vllm_inductor_pass.py", "symbol_reports": [ { "kind": "class", "name": "vllm.compilation.passes.vllm_inductor_pass.InductorCompilationConfig", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "InductorCompilationConfig.splitting_ops", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "InductorCompilationConfig.use_inductor_graph_partition", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.passes.vllm_inductor_pass.VllmPatternMatcherPass", "methods": [ { "kind": "function", "name": "VllmPatternMatcherPass._replace_op_overloads", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "VllmPatternMatcherPass.dump_patterns", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "VllmPatternMatcherPass.matched_count", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VllmPatternMatcherPass._OP_OVERLOAD_PATTERN", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.compilation.passes.vllm_inductor_pass.PrinterInductorPass", "methods": [ { "kind": "function", "name": "PrinterInductorPass.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PrinterInductorPass.__call__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PrinterInductorPass.name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 6, "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.compilation.passes.vllm_inductor_pass.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.compilation.passes.vllm_inductor_pass.VllmInductorPass", "methods": [ { "kind": "function", "name": "VllmInductorPass.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "VllmInductorPass.time_and_log", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "VllmInductorPass.dump_graph", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VllmInductorPass.begin", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "VllmInductorPass.end_and_log", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "VllmInductorPass.dump_prefix", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VllmInductorPass.compilation_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VllmInductorPass.pass_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VllmInductorPass.model_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VllmInductorPass.device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VllmInductorPass.pass_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 10, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 4, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.compilation.passes.vllm_inductor_pass", "names": [ "vllm.compilation.passes.vllm_inductor_pass.InductorCompilationConfig", "vllm.compilation.passes.vllm_inductor_pass.PrinterInductorPass", "vllm.compilation.passes.vllm_inductor_pass.VllmInductorPass", "vllm.compilation.passes.vllm_inductor_pass.VllmPatternMatcherPass", "vllm.compilation.passes.vllm_inductor_pass.logger" ], "n_typable": 29, "n_typed": 22, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 10, "n_classes": 4, "n_attrs": 12, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/compilation/piecewise_backend.py", "symbol_reports": [ { "kind": "class", "name": "vllm.compilation.piecewise_backend.PiecewiseBackend", "methods": [ { "kind": "function", "name": "PiecewiseBackend.__init__", "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "PiecewiseBackend.get_compiled_graph_wrapper", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PiecewiseBackend.check_for_ending_compilation", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PiecewiseBackend.to_bytes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PiecewiseBackend._fakify_args", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PiecewiseBackend._log_compile_start", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PiecewiseBackend._maybe_compile_for_range_entry", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PiecewiseBackend._find_range_for_shape", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PiecewiseBackend.__call__", "n_typed": 0, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PiecewiseBackend.graph", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PiecewiseBackend.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PiecewiseBackend.compilation_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PiecewiseBackend.piecewise_compile_index", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PiecewiseBackend.total_piecewise_compiles", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PiecewiseBackend.vllm_backend", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PiecewiseBackend.compiled_runnables", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PiecewiseBackend.submod_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PiecewiseBackend.is_first_graph", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PiecewiseBackend.is_last_graph", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PiecewiseBackend.is_full_graph", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PiecewiseBackend.is_encoder_compilation", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PiecewiseBackend.compile_ranges", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PiecewiseBackend.compile_sizes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PiecewiseBackend.sym_shape_indices", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PiecewiseBackend.returns_tuple", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PiecewiseBackend.range_entries", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PiecewiseBackend.to_be_compiled_ranges", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PiecewiseBackend.on_compilation_complete", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 44, "n_typed": 22, "n_any": 3, "n_untyped": 19, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 16, "n_attrs": 19, "n_properties": 0 }, { "kind": "attr", "name": "vllm.compilation.piecewise_backend.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.compilation.piecewise_backend.RangeEntry", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "RangeEntry.compile_range", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RangeEntry.compiled", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RangeEntry.runnable", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [ { "kind": "type", "rules": null } ], "name": "vllm.compilation.piecewise_backend", "names": [ "vllm.compilation.piecewise_backend.PiecewiseBackend", "vllm.compilation.piecewise_backend.RangeEntry", "vllm.compilation.piecewise_backend.logger" ], "n_typable": 45, "n_typed": 22, "n_any": 3, "n_untyped": 20, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 16, "n_classes": 2, "n_attrs": 23, "n_properties": 0, "n_type_ignores": 1 }, { "path": "vllm/compilation/wrapper.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.compilation.wrapper.P", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.compilation.wrapper.R", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.compilation.wrapper.TorchCompileWithNoGuardsWrapper", "methods": [ { "kind": "function", "name": "TorchCompileWithNoGuardsWrapper.check_invariants_and_forward", "n_typed": 0, "n_any": 3, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TorchCompileWithNoGuardsWrapper._call_with_optional_nvtx_range", "n_typed": 3, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "TorchCompileWithNoGuardsWrapper.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TorchCompileWithNoGuardsWrapper.aot_compile", "n_typed": 0, "n_any": 3, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TorchCompileWithNoGuardsWrapper.__call__", "n_typed": 0, "n_any": 3, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TorchCompileWithNoGuardsWrapper.forward", "n_typed": 0, "n_any": 3, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TorchCompileWithNoGuardsWrapper.original_code_object", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TorchCompileWithNoGuardsWrapper.bytecode_hook", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TorchCompileWithNoGuardsWrapper._dispatch_to_compiled_code", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TorchCompileWithNoGuardsWrapper.compiled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TorchCompileWithNoGuardsWrapper.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TorchCompileWithNoGuardsWrapper.layerwise_nvtx_tracing_enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TorchCompileWithNoGuardsWrapper.first_compile", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TorchCompileWithNoGuardsWrapper.evaluate_guards", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 27, "n_typed": 9, "n_any": 13, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 13, "n_attrs": 5, "n_properties": 0 }, { "kind": "attr", "name": "vllm.compilation.wrapper.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.compilation.wrapper.reset_compile_wrapper", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.compilation.wrapper", "names": [ "vllm.compilation.wrapper.P", "vllm.compilation.wrapper.R", "vllm.compilation.wrapper.TorchCompileWithNoGuardsWrapper", "vllm.compilation.wrapper.logger", "vllm.compilation.wrapper.reset_compile_wrapper" ], "n_typable": 30, "n_typed": 11, "n_any": 13, "n_untyped": 6, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 13, "n_classes": 1, "n_attrs": 8, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/config/pooler.py", "symbol_reports": [ { "kind": "class", "name": "vllm.config.pooler.PoolerConfig", "methods": [ { "kind": "function", "name": "PoolerConfig.__post_init__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PoolerConfig.get_seq_pooling_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PoolerConfig.get_tok_pooling_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PoolerConfig.compute_hash", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PoolerConfig.pooling_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PoolerConfig.seq_pooling_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PoolerConfig.tok_pooling_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PoolerConfig.use_activation", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PoolerConfig.dimensions", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PoolerConfig.enable_chunked_processing", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PoolerConfig.max_embed_len", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PoolerConfig.logit_bias", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PoolerConfig.step_tag_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PoolerConfig.returned_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 14, "n_typed": 14, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 0, "n_attrs": 10, "n_properties": 0 }, { "kind": "attr", "name": "vllm.config.pooler.SEQ_POOLING_TYPES", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.pooler.TOK_POOLING_TYPES", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.pooler.SequencePoolingType", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.pooler.TokenPoolingType", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.pooler.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.config.pooler", "names": [ "vllm.config.pooler.PoolerConfig", "vllm.config.pooler.SEQ_POOLING_TYPES", "vllm.config.pooler.SequencePoolingType", "vllm.config.pooler.TOK_POOLING_TYPES", "vllm.config.pooler.TokenPoolingType", "vllm.config.pooler.logger" ], "n_typable": 19, "n_typed": 18, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 0, "n_classes": 1, "n_attrs": 15, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/config/speculative.py", "symbol_reports": [ { "kind": "class", "name": "vllm.config.speculative.SpeculativeConfig", "methods": [ { "kind": "function", "name": "SpeculativeConfig.compute_hash", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SpeculativeConfig.hf_config_override", "n_typed": 0, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SpeculativeConfig.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SpeculativeConfig._validate_suffix_decoding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SpeculativeConfig._maybe_override_draft_max_model_len", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SpeculativeConfig._verify_and_get_draft_tp", "n_typed": 3, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SpeculativeConfig.update_arch_", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SpeculativeConfig.create_draft_parallel_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SpeculativeConfig._verify_args", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SpeculativeConfig.verify_equal_vocab_size_if_draft_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SpeculativeConfig.use_eagle", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SpeculativeConfig.uses_draft_model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SpeculativeConfig.uses_extract_hidden_states", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SpeculativeConfig.__repr__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "SpeculativeConfig.max_num_new_slots_for_drafting", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "SpeculativeConfig.enforce_eager", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SpeculativeConfig.num_speculative_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SpeculativeConfig.model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SpeculativeConfig.method", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SpeculativeConfig.draft_tensor_parallel_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SpeculativeConfig.tensor_parallel_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SpeculativeConfig.quantization", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SpeculativeConfig.max_model_len", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SpeculativeConfig.revision", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SpeculativeConfig.code_revision", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SpeculativeConfig.disable_padded_drafter_batch", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SpeculativeConfig.use_local_argmax_reduction", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SpeculativeConfig.prompt_lookup_max", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SpeculativeConfig.prompt_lookup_min", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SpeculativeConfig.speculative_token_tree", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SpeculativeConfig.parallel_drafting", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SpeculativeConfig.target_model_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SpeculativeConfig.target_parallel_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SpeculativeConfig.draft_model_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SpeculativeConfig.draft_parallel_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SpeculativeConfig.suffix_decoding_max_tree_depth", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SpeculativeConfig.suffix_decoding_max_cached_requests", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SpeculativeConfig.suffix_decoding_max_spec_factor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SpeculativeConfig.suffix_decoding_min_token_prob", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SpeculativeConfig.draft_load_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 49, "n_typed": 42, "n_any": 3, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 9, "n_attrs": 25, "n_properties": 1 }, { "kind": "attr", "name": "vllm.config.speculative.EagleModelTypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.speculative.me_quant", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.speculative.MTPModelTypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.speculative.SpeculativeMethod", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.speculative.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [ { "kind": "type", "rules": null }, { "kind": "type", "rules": null }, { "kind": "type", "rules": null }, { "kind": "type", "rules": null } ], "name": "vllm.config.speculative", "names": [ "vllm.config.speculative.EagleModelTypes", "vllm.config.speculative.MTPModelTypes", "vllm.config.speculative.SpeculativeConfig", "vllm.config.speculative.SpeculativeMethod", "vllm.config.speculative.logger", "vllm.config.speculative.me_quant" ], "n_typable": 54, "n_typed": 45, "n_any": 3, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 9, "n_classes": 1, "n_attrs": 30, "n_properties": 1, "n_type_ignores": 4 }, { "path": "vllm/config/vllm.py", "symbol_reports": [ { "kind": "function", "name": "vllm.config.vllm.get_current_vllm_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.config.vllm.get_layers_from_vllm_config", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.config.vllm.get_cached_compilation_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "class", "name": "vllm.config.vllm.VllmConfig", "methods": [ { "kind": "function", "name": "VllmConfig.compute_hash", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "VllmConfig.enable_trace_function_call_for_thread", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "VllmConfig._get_quantization_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VllmConfig.get_quantization_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VllmConfig.with_hf_config", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VllmConfig._set_config_default", "n_typed": 2, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "VllmConfig._apply_optimization_level_defaults", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "VllmConfig._post_init_kv_transfer_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "VllmConfig.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "VllmConfig.update_sizes_for_sequence_parallelism", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "VllmConfig._set_max_num_scheduled_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "VllmConfig._set_cudagraph_sizes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "VllmConfig._set_compile_ranges", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "VllmConfig.try_verify_and_update_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "VllmConfig.compile_debug_dump_path", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "VllmConfig.__str__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "VllmConfig.validate_mamba_block_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "VllmConfig.num_speculative_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "VllmConfig.needs_dp_coordinator", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "VllmConfig.model_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VllmConfig.cache_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VllmConfig.parallel_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VllmConfig.scheduler_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VllmConfig.device_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VllmConfig.load_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VllmConfig.offload_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VllmConfig.attention_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VllmConfig.kernel_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VllmConfig.lora_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VllmConfig.speculative_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VllmConfig.structured_outputs_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VllmConfig.observability_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VllmConfig.quant_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VllmConfig.compilation_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VllmConfig.profiler_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VllmConfig.kv_transfer_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VllmConfig.kv_events_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VllmConfig.ec_transfer_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VllmConfig.additional_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VllmConfig.instance_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VllmConfig.optimization_level", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VllmConfig.performance_mode", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VllmConfig.weight_transfer_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 54, "n_typed": 45, "n_any": 3, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 17, "n_method_overloads": 17, "n_method_params": 11, "n_attrs": 24, "n_properties": 2 }, { "kind": "function", "name": "vllm.config.vllm.get_current_vllm_config_or_none", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.config.vllm.set_current_vllm_config", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.config.vllm.OptimizationLevel", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "OptimizationLevel.O0", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "OptimizationLevel.O1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "OptimizationLevel.O2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "OptimizationLevel.O3", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "attr", "name": "vllm.config.vllm.OPTIMIZATION_LEVEL_03", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.config.vllm.enable_norm_pad_fusion", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.config.vllm.IS_DENSE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.config.vllm.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.vllm.OPTIMIZATION_LEVEL_02", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.config.vllm.OPTIMIZATION_LEVEL_00", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.config.vllm.enable_norm_fusion", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.config.vllm.OPTIMIZATION_LEVEL_TO_CONFIG", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.config.vllm.OPTIMIZATION_LEVEL_01", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.config.vllm.T", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.config.vllm.PerformanceMode", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.config.vllm.enable_allreduce_rms_fusion", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.config.vllm.enable_act_fusion", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.config.vllm.IS_QUANTIZED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.config.vllm.enable_rope_kvcache_fusion", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.config.vllm", "names": [ "vllm.config.vllm.IS_DENSE", "vllm.config.vllm.IS_QUANTIZED", "vllm.config.vllm.OPTIMIZATION_LEVEL_00", "vllm.config.vllm.OPTIMIZATION_LEVEL_01", "vllm.config.vllm.OPTIMIZATION_LEVEL_02", "vllm.config.vllm.OPTIMIZATION_LEVEL_03", "vllm.config.vllm.OPTIMIZATION_LEVEL_TO_CONFIG", "vllm.config.vllm.OptimizationLevel", "vllm.config.vllm.PerformanceMode", "vllm.config.vllm.T", "vllm.config.vllm.VllmConfig", "vllm.config.vllm.enable_act_fusion", "vllm.config.vllm.enable_allreduce_rms_fusion", "vllm.config.vllm.enable_norm_fusion", "vllm.config.vllm.enable_norm_pad_fusion", "vllm.config.vllm.enable_rope_kvcache_fusion", "vllm.config.vllm.get_cached_compilation_config", "vllm.config.vllm.get_current_vllm_config", "vllm.config.vllm.get_current_vllm_config_or_none", "vllm.config.vllm.get_layers_from_vllm_config", "vllm.config.vllm.logger", "vllm.config.vllm.set_current_vllm_config" ], "n_typable": 77, "n_typed": 64, "n_any": 3, "n_untyped": 10, "n_functions": 10, "n_function_overloads": 10, "n_function_params": 11, "n_methods": 17, "n_method_overloads": 17, "n_method_params": 11, "n_classes": 2, "n_attrs": 38, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/config/ec_transfer.py", "symbol_reports": [ { "kind": "class", "name": "vllm.config.ec_transfer.ECTransferConfig", "methods": [ { "kind": "function", "name": "ECTransferConfig.compute_hash", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ECTransferConfig.__post_init__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ECTransferConfig.get_from_extra_config", "n_typed": 0, "n_any": 1, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [ { "kind": "property", "name": "ECTransferConfig.is_ec_transfer_instance", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ECTransferConfig.is_ec_producer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ECTransferConfig.is_ec_consumer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "ECTransferConfig.ec_connector", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ECTransferConfig.engine_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ECTransferConfig.ec_buffer_device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ECTransferConfig.ec_buffer_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ECTransferConfig.ec_role", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ECTransferConfig.ec_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ECTransferConfig.ec_parallel_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ECTransferConfig.ec_ip", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ECTransferConfig.ec_port", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ECTransferConfig.ec_connector_extra_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ECTransferConfig.ec_connector_module_path", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 19, "n_typed": 16, "n_any": 1, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 2, "n_attrs": 11, "n_properties": 3 }, { "kind": "attr", "name": "vllm.config.ec_transfer.ECRole", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.ec_transfer.ECConsumer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.ec_transfer.ECProducer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.config.ec_transfer", "names": [ "vllm.config.ec_transfer.ECConsumer", "vllm.config.ec_transfer.ECProducer", "vllm.config.ec_transfer.ECRole", "vllm.config.ec_transfer.ECTransferConfig" ], "n_typable": 22, "n_typed": 19, "n_any": 1, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 2, "n_classes": 1, "n_attrs": 14, "n_properties": 3, "n_type_ignores": 0 }, { "path": "vllm/config/compilation.py", "symbol_reports": [ { "kind": "class", "name": "vllm.config.compilation.CompilationConfig", "methods": [ { "kind": "function", "name": "CompilationConfig.compute_hash", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CompilationConfig.__repr__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CompilationConfig.__str__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CompilationConfig.validate_mode_before", "n_typed": 0, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompilationConfig.validate_cudagraph_mode_before", "n_typed": 0, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompilationConfig.validate_pass_config_before", "n_typed": 0, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompilationConfig.validate_compile_cache_save_format", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompilationConfig._skip_none_validation", "n_typed": 1, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CompilationConfig.__post_init__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CompilationConfig.init_backend", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompilationConfig.post_init_cudagraph_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CompilationConfig.set_splitting_ops_for_v1", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CompilationConfig.set_splitting_ops_for_attn_fusion", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CompilationConfig.splitting_ops_contain_attention", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CompilationConfig.is_attention_compiled_piecewise", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CompilationConfig.custom_op_log_check", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CompilationConfig.is_custom_op_enabled", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompilationConfig.adjust_cudagraph_sizes_for_spec_decode", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CompilationConfig.get_compile_ranges", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CompilationConfig.level", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompilationConfig.mode", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompilationConfig.debug_dump_path", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompilationConfig.cache_dir", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompilationConfig.compile_cache_save_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompilationConfig.backend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompilationConfig.custom_ops", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompilationConfig.splitting_ops", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompilationConfig.compile_mm_encoder", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompilationConfig.compile_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompilationConfig.compile_ranges_split_points", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompilationConfig.inductor_compile_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompilationConfig.inductor_passes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompilationConfig.cudagraph_mode", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompilationConfig.cudagraph_num_of_warmups", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompilationConfig.cudagraph_capture_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompilationConfig.cudagraph_copy_inputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompilationConfig.cudagraph_specialize_lora", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompilationConfig.use_inductor_graph_partition", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompilationConfig.pass_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompilationConfig.max_cudagraph_capture_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompilationConfig.dynamic_shapes_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompilationConfig.local_cache_dir", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompilationConfig.fast_moe_cold_start", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompilationConfig.enabled_custom_ops", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompilationConfig.disabled_custom_ops", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompilationConfig.traced_files", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompilationConfig.compilation_time", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompilationConfig.static_forward_context", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompilationConfig.static_all_moe_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompilationConfig._attention_ops", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 62, "n_typed": 50, "n_any": 8, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 19, "n_method_overloads": 19, "n_method_params": 12, "n_attrs": 31, "n_properties": 0 }, { "kind": "class", "name": "vllm.config.compilation.CUDAGraphMode", "methods": [ { "kind": "function", "name": "CUDAGraphMode.decode_mode", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CUDAGraphMode.mixed_mode", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CUDAGraphMode.has_mode", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CUDAGraphMode.requires_piecewise_compilation", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CUDAGraphMode.max_cudagraph_mode", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CUDAGraphMode.has_full_cudagraphs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CUDAGraphMode.has_piecewise_cudagraphs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CUDAGraphMode.separate_routine", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CUDAGraphMode.valid_runtime_modes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CUDAGraphMode.is_valid_runtime_mode", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CUDAGraphMode.__str__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CUDAGraphMode.NONE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CUDAGraphMode.PIECEWISE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CUDAGraphMode.FULL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CUDAGraphMode.FULL_DECODE_ONLY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CUDAGraphMode.FULL_AND_PIECEWISE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 1, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.config.compilation.PassConfig", "methods": [ { "kind": "function", "name": "PassConfig.flashinfer_max_size", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PassConfig.default_fi_allreduce_fusion_max_size_mb", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PassConfig.compute_hash", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PassConfig._skip_none_validation", "n_typed": 1, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PassConfig.__post_init__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PassConfig.fuse_norm_quant", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PassConfig.fuse_act_quant", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PassConfig.fuse_attn_quant", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PassConfig.eliminate_noops", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PassConfig.enable_sp", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PassConfig.fuse_gemm_comms", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PassConfig.fuse_allreduce_rms", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PassConfig.enable_qk_norm_rope_fusion", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PassConfig.fuse_act_padding", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PassConfig.fuse_rope_kvcache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PassConfig.rope_kvcache_fusion_max_token_num", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PassConfig.fi_allreduce_fusion_max_size_mb", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PassConfig.sp_min_token_num", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 21, "n_typed": 19, "n_any": 2, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 3, "n_attrs": 13, "n_properties": 0 }, { "kind": "class", "name": "vllm.config.compilation.CompilationMode", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "CompilationMode.NONE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CompilationMode.STOCK_TORCH_COMPILE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CompilationMode.DYNAMO_TRACE_ONCE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CompilationMode.VLLM_COMPILE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.config.compilation.DynamicShapesConfig", "methods": [ { "kind": "function", "name": "DynamicShapesConfig.compute_hash", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DynamicShapesConfig.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DynamicShapesConfig.evaluate_guards", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DynamicShapesConfig.assume_32_bit_indexing", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.config.compilation.VllmConfig", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.config.compilation.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.config.compilation.DynamicShapesType", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "DynamicShapesType.BACKED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DynamicShapesType.UNBACKED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DynamicShapesType.BACKED_SIZE_OBLIVIOUS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [ { "kind": "type", "rules": null } ], "name": "vllm.config.compilation", "names": [ "vllm.config.compilation.CUDAGraphMode", "vllm.config.compilation.CompilationConfig", "vllm.config.compilation.CompilationMode", "vllm.config.compilation.DynamicShapesConfig", "vllm.config.compilation.DynamicShapesType", "vllm.config.compilation.PassConfig", "vllm.config.compilation.VllmConfig", "vllm.config.compilation.logger" ], "n_typable": 100, "n_typed": 85, "n_any": 10, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 36, "n_method_overloads": 36, "n_method_params": 16, "n_classes": 6, "n_attrs": 61, "n_properties": 0, "n_type_ignores": 1 }, { "path": "vllm/config/model.py", "symbol_reports": [ { "kind": "class", "name": "vllm.config.model.ModelConfig", "methods": [ { "kind": "function", "name": "ModelConfig.compute_hash", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelConfig._update_nested", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ModelConfig._apply_dict_overrides", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ModelConfig.__post_init__", "n_typed": 15, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 15, "n_params": 14, "n_function_overloads": 1, "n_function_params": 14 }, { "kind": "function", "name": "ModelConfig.get_model_arch_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelConfig._skip_none_validation", "n_typed": 1, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ModelConfig._lowercase_tokenizer_mode", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModelConfig.validate_quantization_before", "n_typed": 0, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModelConfig.validate_model_config_after", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelConfig._get_transformers_backend_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelConfig.using_transformers_backend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelConfig.maybe_pull_model_tokenizer_for_runai", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ModelConfig._get_encoder_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelConfig._get_default_runner_type", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModelConfig._get_runner_type", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ModelConfig._get_default_convert_type", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ModelConfig._get_convert_type", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ModelConfig._verify_quantization", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelConfig._verify_cuda_graph", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelConfig._verify_bnb_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelConfig._verify_with_expert_parallelism", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelConfig._try_verify_and_update_model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelConfig.verify_dual_chunk_attention_config", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModelConfig.verify_with_parallel_config", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModelConfig.get_sliding_window", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelConfig.get_vocab_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelConfig.get_hidden_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelConfig.get_inputs_embeds_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelConfig.get_head_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelConfig.get_total_num_kv_heads", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelConfig.get_num_kv_heads", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModelConfig.get_num_attention_heads", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModelConfig.get_num_experts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelConfig.get_total_num_hidden_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelConfig.get_layers_start_end_indices", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModelConfig.get_num_layers", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModelConfig.get_num_layers_by_block_type", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ModelConfig.get_mamba_chunk_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelConfig.get_multimodal_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelConfig.try_get_generation_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelConfig.get_diff_sampling_param", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelConfig.get_and_verify_max_len", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModelConfig.is_nvfp4_quantized", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "ModelConfig.registry", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "ModelConfig.architectures", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ModelConfig.architecture", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ModelConfig.is_deepseek_mla", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ModelConfig.is_mm_prefix_lm", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ModelConfig.is_encoder_decoder", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ModelConfig.uses_alibi", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ModelConfig.uses_mrope", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ModelConfig.uses_xdrope_dim", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ModelConfig.is_multimodal_model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ModelConfig.is_multimodal_raw_input_only_model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ModelConfig.requires_raw_input_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ModelConfig.is_cross_encoder", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ModelConfig.is_late_interaction", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ModelConfig.is_pp_supported", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ModelConfig.is_attention_free", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ModelConfig.is_hybrid", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ModelConfig.has_noops", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ModelConfig.has_inner_state", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "ModelConfig.supports_mamba_prefix_caching", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ModelConfig.use_mla", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ModelConfig.is_matryoshka", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ModelConfig.matryoshka_dimensions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "ModelConfig.use_sep_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ModelConfig.head_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ModelConfig.embedding_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "ModelConfig.attn_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ModelConfig.is_chunked_prefill_supported", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ModelConfig.is_prefix_caching_supported", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ModelConfig.is_moe", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ModelConfig.is_quantized", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "ModelConfig.model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.model_weights", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.runner", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.convert", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.tokenizer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.tokenizer_mode", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.trust_remote_code", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.seed", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.hf_config", "n_typed": 0, "n_any": 1, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.hf_text_config", "n_typed": 0, "n_any": 1, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.hf_config_path", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.allowed_local_media_path", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.allowed_media_domains", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.revision", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.code_revision", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.tokenizer_revision", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.max_model_len", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.spec_target_max_model_len", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.quantization", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.allow_deprecated_quantization", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.enforce_eager", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.enable_return_routed_experts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.max_logprobs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.logprobs_mode", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.disable_sliding_window", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.disable_cascade_attn", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.skip_tokenizer_init", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.enable_prompt_embeds", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.served_model_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.config_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.hf_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.hf_overrides", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.generation_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.override_generation_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.enable_sleep_mode", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.model_impl", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.override_attention_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.logits_processors", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.io_processor_plugin", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.pooler_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.multimodal_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.language_model_only", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.limit_mm_per_prompt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.enable_mm_embeds", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.media_io_kwargs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.mm_processor_kwargs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.mm_processor_cache_gb", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.mm_processor_cache_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.mm_shm_cache_max_object_size_mb", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.mm_encoder_only", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.mm_encoder_tp_mode", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.mm_encoder_attn_backend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.interleave_mm_strings", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.skip_mm_profiling", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.video_pruning_rate", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.attention_chunk_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.encoder_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.hf_image_processor_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.model_arch_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.runner_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.convert_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.original_max_model_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModelConfig.config_updated", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 179, "n_typed": 151, "n_any": 14, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 43, "n_method_overloads": 43, "n_method_params": 41, "n_attrs": 64, "n_properties": 31 }, { "kind": "function", "name": "vllm.config.model.iter_architecture_defaults", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.config.model.try_match_architecture_defaults", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.config.model.str_dtype_to_torch_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.config.model.me_models", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.config.model.get_served_model_name", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.config.model.RunnerOption", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.model.ConvertType", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.model.ModelImpl", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.model.me_quant", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.model.ConvertOption", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.model.TokenizerMode", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.model.AttnTypeStr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.model.LayerBlockType", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.model.LogprobsMode", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.model.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.model.HfOverrides", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.config.model.ModelDType", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.config.model", "names": [ "vllm.config.model.AttnTypeStr", "vllm.config.model.ConvertOption", "vllm.config.model.ConvertType", "vllm.config.model.HfOverrides", "vllm.config.model.LayerBlockType", "vllm.config.model.LogprobsMode", "vllm.config.model.ModelConfig", "vllm.config.model.ModelDType", "vllm.config.model.ModelImpl", "vllm.config.model.RunnerOption", "vllm.config.model.TokenizerMode", "vllm.config.model.get_served_model_name", "vllm.config.model.iter_architecture_defaults", "vllm.config.model.logger", "vllm.config.model.me_models", "vllm.config.model.me_quant", "vllm.config.model.str_dtype_to_torch_dtype", "vllm.config.model.try_match_architecture_defaults" ], "n_typable": 201, "n_typed": 167, "n_any": 14, "n_untyped": 20, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 6, "n_methods": 43, "n_method_overloads": 43, "n_method_params": 41, "n_classes": 1, "n_attrs": 77, "n_properties": 31, "n_type_ignores": 0 }, { "path": "vllm/config/device.py", "symbol_reports": [ { "kind": "class", "name": "vllm.config.device.DeviceConfig", "methods": [ { "kind": "function", "name": "DeviceConfig.compute_hash", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeviceConfig.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DeviceConfig.device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeviceConfig.device_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.config.device.Device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.config.device", "names": [ "vllm.config.device.Device", "vllm.config.device.DeviceConfig" ], "n_typable": 5, "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 0, "n_classes": 1, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/config/multimodal.py", "symbol_reports": [ { "kind": "class", "name": "vllm.config.multimodal.MultiModalConfig", "methods": [ { "kind": "function", "name": "MultiModalConfig._validate_limit_per_prompt", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiModalConfig._validate_mm_encoder_attn_backend", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiModalConfig._validate_multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MultiModalConfig.compute_hash", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MultiModalConfig.get_limit_per_prompt", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiModalConfig.merge_mm_processor_kwargs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiModalConfig.is_multimodal_pruning_enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MultiModalConfig.language_model_only", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MultiModalConfig.limit_per_prompt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MultiModalConfig.enable_mm_embeds", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MultiModalConfig.media_io_kwargs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MultiModalConfig.mm_processor_kwargs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MultiModalConfig.mm_processor_cache_gb", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MultiModalConfig.mm_processor_cache_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MultiModalConfig.mm_shm_cache_max_object_size_mb", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MultiModalConfig.mm_encoder_only", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MultiModalConfig.mm_encoder_tp_mode", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MultiModalConfig.mm_encoder_attn_backend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MultiModalConfig.interleave_mm_strings", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MultiModalConfig.skip_mm_profiling", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MultiModalConfig.video_pruning_rate", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 25, "n_typed": 23, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 4, "n_attrs": 14, "n_properties": 0 }, { "kind": "attr", "name": "vllm.config.multimodal.MMEncoderTPMode", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.multimodal.MMDummyOptions", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.config.multimodal.ImageDummyOptions", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ImageDummyOptions.width", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ImageDummyOptions.height", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.config.multimodal.BaseDummyOptions", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "BaseDummyOptions.count", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.config.multimodal.VideoDummyOptions", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "VideoDummyOptions.num_frames", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VideoDummyOptions.width", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VideoDummyOptions.height", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.config.multimodal.AudioDummyOptions", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "AudioDummyOptions.length", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.config.multimodal.MultiModalDummyOptionsBuiltins", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "MultiModalDummyOptionsBuiltins.image", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MultiModalDummyOptionsBuiltins.video", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MultiModalDummyOptionsBuiltins.audio", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.config.multimodal.MMCacheType", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.config.multimodal", "names": [ "vllm.config.multimodal.AudioDummyOptions", "vllm.config.multimodal.BaseDummyOptions", "vllm.config.multimodal.ImageDummyOptions", "vllm.config.multimodal.MMCacheType", "vllm.config.multimodal.MMDummyOptions", "vllm.config.multimodal.MMEncoderTPMode", "vllm.config.multimodal.MultiModalConfig", "vllm.config.multimodal.MultiModalDummyOptionsBuiltins", "vllm.config.multimodal.VideoDummyOptions" ], "n_typable": 28, "n_typed": 26, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 4, "n_classes": 6, "n_attrs": 27, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/config/speech_to_text.py", "symbol_reports": [ { "kind": "class", "name": "vllm.config.speech_to_text.SpeechToTextConfig", "methods": [], "properties": [ { "kind": "property", "name": "SpeechToTextConfig.allow_audio_chunking", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "SpeechToTextConfig.sample_rate", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SpeechToTextConfig.max_audio_clip_s", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SpeechToTextConfig.overlap_chunk_second", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SpeechToTextConfig.min_energy_split_window_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 1 } ], "type_ignores": [], "name": "vllm.config.speech_to_text", "names": [ "vllm.config.speech_to_text.SpeechToTextConfig" ], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 1, "n_attrs": 4, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/config/utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.config.utils.update_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.config.utils.ConfigType", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.config.utils.get_attr_docs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.config.utils.config", "n_typed": 3, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.config.utils.is_init_field", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.config.utils.replace", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.config.utils.SupportsMetricsInfo", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.config.utils.SupportsHash", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.config.utils.hash_factors", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.config.utils.get_hash_factors", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.config.utils.normalize_value", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.config.utils.ConfigT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.config.utils.handle_deprecated", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.config.utils.set_from_deprecated_env_if_set", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.config.utils.get_from_deprecated_env_if_set", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.config.utils.get_field", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.config.utils.Range", "methods": [ { "kind": "function", "name": "Range.is_single_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Range.__contains__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Range.__eq__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Range.__hash__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Range.__str__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Range.__repr__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Range.start", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Range.end", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 8, "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 2, "n_attrs": 2, "n_properties": 0 }, { "kind": "function", "name": "vllm.config.utils.getattr_iter", "n_typed": 5, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "attr", "name": "vllm.config.utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.config.utils", "names": [ "vllm.config.utils.ConfigT", "vllm.config.utils.ConfigType", "vllm.config.utils.Range", "vllm.config.utils.SupportsHash", "vllm.config.utils.SupportsMetricsInfo", "vllm.config.utils.config", "vllm.config.utils.get_attr_docs", "vllm.config.utils.get_field", "vllm.config.utils.get_from_deprecated_env_if_set", "vllm.config.utils.get_hash_factors", "vllm.config.utils.getattr_iter", "vllm.config.utils.handle_deprecated", "vllm.config.utils.hash_factors", "vllm.config.utils.is_init_field", "vllm.config.utils.logger", "vllm.config.utils.normalize_value", "vllm.config.utils.replace", "vllm.config.utils.set_from_deprecated_env_if_set", "vllm.config.utils.update_config" ], "n_typable": 56, "n_typed": 49, "n_any": 3, "n_untyped": 4, "n_functions": 13, "n_function_overloads": 13, "n_function_params": 34, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 2, "n_classes": 3, "n_attrs": 5, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/config/load.py", "symbol_reports": [ { "kind": "class", "name": "vllm.config.load.LoadConfig", "methods": [ { "kind": "function", "name": "LoadConfig.compute_hash", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LoadConfig._lowercase_load_format", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LoadConfig._validate_ignore_patterns", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LoadConfig.load_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LoadConfig.download_dir", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LoadConfig.safetensors_load_strategy", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LoadConfig.model_loader_extra_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LoadConfig.device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LoadConfig.ignore_patterns", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LoadConfig.use_tqdm_on_load", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LoadConfig.pt_load_map_location", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 13, "n_typed": 13, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 2, "n_attrs": 8, "n_properties": 0 }, { "kind": "attr", "name": "vllm.config.load.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.config.load", "names": [ "vllm.config.load.LoadConfig", "vllm.config.load.logger" ], "n_typable": 14, "n_typed": 13, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 2, "n_classes": 1, "n_attrs": 9, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/config/kv_events.py", "symbol_reports": [ { "kind": "class", "name": "vllm.config.kv_events.KVEventsConfig", "methods": [ { "kind": "function", "name": "KVEventsConfig.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "KVEventsConfig.enable_kv_cache_events", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KVEventsConfig.publisher", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KVEventsConfig.endpoint", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KVEventsConfig.replay_endpoint", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KVEventsConfig.buffer_steps", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KVEventsConfig.hwm", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KVEventsConfig.max_queue_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KVEventsConfig.topic", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 9, "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 8, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.config.kv_events", "names": [ "vllm.config.kv_events.KVEventsConfig" ], "n_typable": 9, "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_classes": 1, "n_attrs": 8, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/config/offload.py", "symbol_reports": [ { "kind": "class", "name": "vllm.config.offload.UVAOffloadConfig", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "UVAOffloadConfig.cpu_offload_gb", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "UVAOffloadConfig.cpu_offload_params", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.config.offload.PrefetchOffloadConfig", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "PrefetchOffloadConfig.offload_group_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PrefetchOffloadConfig.offload_num_in_group", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PrefetchOffloadConfig.offload_prefetch_step", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PrefetchOffloadConfig.offload_params", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.config.offload.OffloadConfig", "methods": [ { "kind": "function", "name": "OffloadConfig.validate_offload_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "OffloadConfig.compute_hash", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OffloadConfig.offload_backend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "OffloadConfig.uva", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "OffloadConfig.prefetch", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.config.offload.OffloadBackend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.config.offload", "names": [ "vllm.config.offload.OffloadBackend", "vllm.config.offload.OffloadConfig", "vllm.config.offload.PrefetchOffloadConfig", "vllm.config.offload.UVAOffloadConfig" ], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 0, "n_classes": 3, "n_attrs": 10, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/config/kernel.py", "symbol_reports": [ { "kind": "class", "name": "vllm.config.kernel.KernelConfig", "methods": [ { "kind": "function", "name": "KernelConfig._normalize_moe_backend", "n_typed": 0, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KernelConfig.compute_hash", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KernelConfig._skip_none_validation", "n_typed": 1, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "KernelConfig.enable_flashinfer_autotune", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KernelConfig.moe_backend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 8, "n_typed": 4, "n_any": 4, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.config.kernel.MoEBackend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.config.kernel", "names": [ "vllm.config.kernel.KernelConfig", "vllm.config.kernel.MoEBackend" ], "n_typable": 9, "n_typed": 5, "n_any": 4, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_classes": 1, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/config/structured_outputs.py", "symbol_reports": [ { "kind": "class", "name": "vllm.config.structured_outputs.StructuredOutputsConfig", "methods": [ { "kind": "function", "name": "StructuredOutputsConfig.compute_hash", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "StructuredOutputsConfig._validate_structured_output_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "StructuredOutputsConfig.backend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "StructuredOutputsConfig.disable_fallback", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "StructuredOutputsConfig.disable_any_whitespace", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "StructuredOutputsConfig.disable_additional_properties", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "StructuredOutputsConfig.reasoning_parser", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "StructuredOutputsConfig.reasoning_parser_plugin", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "StructuredOutputsConfig.enable_in_reasoning", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 9, "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 0, "n_attrs": 7, "n_properties": 0 }, { "kind": "attr", "name": "vllm.config.structured_outputs.StructuredOutputsBackend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.config.structured_outputs", "names": [ "vllm.config.structured_outputs.StructuredOutputsBackend", "vllm.config.structured_outputs.StructuredOutputsConfig" ], "n_typable": 10, "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 0, "n_classes": 1, "n_attrs": 8, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/config/kv_transfer.py", "symbol_reports": [ { "kind": "class", "name": "vllm.config.kv_transfer.KVTransferConfig", "methods": [ { "kind": "function", "name": "KVTransferConfig.compute_hash", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KVTransferConfig.__post_init__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KVTransferConfig.get_from_extra_config", "n_typed": 0, "n_any": 1, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [ { "kind": "property", "name": "KVTransferConfig.is_kv_transfer_instance", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "KVTransferConfig.is_kv_producer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "KVTransferConfig.is_kv_consumer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "KVTransferConfig.kv_connector", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KVTransferConfig.engine_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KVTransferConfig.kv_buffer_device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KVTransferConfig.kv_buffer_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KVTransferConfig.kv_role", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KVTransferConfig.kv_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KVTransferConfig.kv_parallel_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KVTransferConfig.kv_ip", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KVTransferConfig.kv_port", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KVTransferConfig.kv_connector_extra_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KVTransferConfig.kv_connector_module_path", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KVTransferConfig.enable_permute_local_kv", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KVTransferConfig.kv_load_failure_policy", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 21, "n_typed": 18, "n_any": 1, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 2, "n_attrs": 13, "n_properties": 3 }, { "kind": "attr", "name": "vllm.config.kv_transfer.KVProducer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.kv_transfer.KVConsumer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.kv_transfer.KVRole", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.config.kv_transfer", "names": [ "vllm.config.kv_transfer.KVConsumer", "vllm.config.kv_transfer.KVProducer", "vllm.config.kv_transfer.KVRole", "vllm.config.kv_transfer.KVTransferConfig" ], "n_typable": 24, "n_typed": 21, "n_any": 1, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 2, "n_classes": 1, "n_attrs": 16, "n_properties": 3, "n_type_ignores": 0 }, { "path": "vllm/config/profiler.py", "symbol_reports": [ { "kind": "class", "name": "vllm.config.profiler.ProfilerConfig", "methods": [ { "kind": "function", "name": "ProfilerConfig.compute_hash", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ProfilerConfig._validate_profiler_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ProfilerConfig.profiler", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ProfilerConfig.torch_profiler_dir", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ProfilerConfig.torch_profiler_with_stack", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ProfilerConfig.torch_profiler_with_flops", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ProfilerConfig.torch_profiler_use_gzip", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ProfilerConfig.torch_profiler_dump_cuda_time_total", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ProfilerConfig.torch_profiler_record_shapes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ProfilerConfig.torch_profiler_with_memory", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ProfilerConfig.ignore_frontend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ProfilerConfig.delay_iterations", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ProfilerConfig.max_iterations", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 13, "n_typed": 13, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 0, "n_attrs": 11, "n_properties": 0 }, { "kind": "attr", "name": "vllm.config.profiler.ProfilerKind", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.profiler.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.config.profiler", "names": [ "vllm.config.profiler.ProfilerConfig", "vllm.config.profiler.ProfilerKind", "vllm.config.profiler.logger" ], "n_typable": 15, "n_typed": 14, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 0, "n_classes": 1, "n_attrs": 13, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/config/parallel.py", "symbol_reports": [ { "kind": "class", "name": "vllm.config.parallel.ParallelConfig", "methods": [ { "kind": "function", "name": "ParallelConfig._skip_none_validation", "n_typed": 1, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ParallelConfig._validate_parallel_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ParallelConfig.get_next_dp_init_port", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ParallelConfig.allocate_elastic_ep_ports", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ParallelConfig.get_next_stateless_world_group_port", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ParallelConfig.get_next_stateless_dp_group_port", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ParallelConfig.get_next_stateless_ep_group_port", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ParallelConfig.get_next_stateless_eplb_group_port", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ParallelConfig.stateless_init_dp_group", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ParallelConfig.has_unfinished_dp", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ParallelConfig.sync_kv_cache_memory_size", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ParallelConfig.compute_hash", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ParallelConfig.__post_init__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ParallelConfig._verify_args", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "ParallelConfig.world_size_across_dp", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ParallelConfig.use_ubatching", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ParallelConfig.num_ubatches", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ParallelConfig.local_engines_only", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ParallelConfig.use_sequence_parallel_moe", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ParallelConfig.node_rank_within_dp", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ParallelConfig.nnodes_within_dp", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ParallelConfig.local_world_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ParallelConfig.use_ray", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "ParallelConfig.pipeline_parallel_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.tensor_parallel_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.prefill_context_parallel_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.data_parallel_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.data_parallel_size_local", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.data_parallel_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.data_parallel_rank_local", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.data_parallel_master_ip", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.data_parallel_rpc_port", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.data_parallel_master_port", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.data_parallel_backend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.data_parallel_external_lb", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.data_parallel_hybrid_lb", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.is_moe_model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.enable_expert_parallel", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.enable_eplb", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.eplb_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.expert_placement_strategy", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.all2all_backend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.max_parallel_loading_workers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.disable_custom_all_reduce", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.enable_elastic_ep", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.enable_dbo", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.ubatch_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.dbo_decode_token_threshold", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.dbo_prefill_token_threshold", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.disable_nccl_for_dp_synchronization", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.ray_workers_use_nsight", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.ray_runtime_env", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.placement_group", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.distributed_executor_backend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.worker_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.sd_worker_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.worker_extension_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.master_addr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.master_port", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.node_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.nnodes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.world_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig._data_parallel_master_port_list", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig._stateless_dp_group_port_list", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig._stateless_ep_group_port_list", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig._stateless_eplb_group_port_list", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig._stateless_world_group_port_list", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.decode_context_parallel_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.dcp_kv_cache_interleave_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.cp_kv_cache_interleave_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig.data_parallel_index", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig._api_process_count", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParallelConfig._api_process_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 81, "n_typed": 78, "n_any": 2, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 7, "n_attrs": 51, "n_properties": 9 }, { "kind": "class", "name": "vllm.config.parallel.EPLBConfig", "methods": [ { "kind": "function", "name": "EPLBConfig._validate_eplb_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EPLBConfig.window_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EPLBConfig.step_interval", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EPLBConfig.num_redundant_experts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EPLBConfig.log_balancedness", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EPLBConfig.log_balancedness_interval", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EPLBConfig.use_async", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EPLBConfig.policy", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 8, "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 7, "n_properties": 0 }, { "kind": "attr", "name": "vllm.config.parallel.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.parallel.All2AllBackend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.parallel.ExpertPlacementStrategy", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.parallel.DistributedExecutorBackend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.parallel.DataParallelBackend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.parallel.EPLBPolicyOption", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.config.parallel", "names": [ "vllm.config.parallel.All2AllBackend", "vllm.config.parallel.DataParallelBackend", "vllm.config.parallel.DistributedExecutorBackend", "vllm.config.parallel.EPLBConfig", "vllm.config.parallel.EPLBPolicyOption", "vllm.config.parallel.ExpertPlacementStrategy", "vllm.config.parallel.ParallelConfig", "vllm.config.parallel.logger" ], "n_typable": 95, "n_typed": 91, "n_any": 2, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 7, "n_classes": 2, "n_attrs": 64, "n_properties": 9, "n_type_ignores": 0 }, { "path": "vllm/config/attention.py", "symbol_reports": [ { "kind": "class", "name": "vllm.config.attention.AttentionConfig", "methods": [ { "kind": "function", "name": "AttentionConfig.compute_hash", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AttentionConfig.validate_backend_before", "n_typed": 0, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AttentionConfig.backend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AttentionConfig.flash_attn_version", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AttentionConfig.use_prefill_decode_attention", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AttentionConfig.flash_attn_max_num_splits_for_cuda_graph", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AttentionConfig.use_cudnn_prefill", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AttentionConfig.use_trtllm_ragged_deepseek_prefill", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AttentionConfig.use_trtllm_attention", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AttentionConfig.disable_flashinfer_prefill", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AttentionConfig.disable_flashinfer_q_quantization", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AttentionConfig.use_prefill_query_quantization", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 13, "n_typed": 11, "n_any": 2, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 10, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.config.attention", "names": [ "vllm.config.attention.AttentionConfig" ], "n_typable": 13, "n_typed": 11, "n_any": 2, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_classes": 1, "n_attrs": 10, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/config/observability.py", "symbol_reports": [ { "kind": "class", "name": "vllm.config.observability.ObservabilityConfig", "methods": [ { "kind": "function", "name": "ObservabilityConfig.compute_hash", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ObservabilityConfig._validate_show_hidden_metrics_for_version", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ObservabilityConfig._validate_otlp_traces_endpoint", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ObservabilityConfig._validate_collect_detailed_traces", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ObservabilityConfig._validate_tracing_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "ObservabilityConfig.show_hidden_metrics", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ObservabilityConfig.collect_model_forward_time", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ObservabilityConfig.collect_model_execute_time", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "ObservabilityConfig.show_hidden_metrics_for_version", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ObservabilityConfig.otlp_traces_endpoint", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ObservabilityConfig.collect_detailed_traces", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ObservabilityConfig.kv_cache_metrics", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ObservabilityConfig.kv_cache_metrics_sample", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ObservabilityConfig.cudagraph_metrics", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ObservabilityConfig.enable_layerwise_nvtx_tracing", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ObservabilityConfig.enable_mfu_metrics", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ObservabilityConfig.enable_mm_processor_stats", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ObservabilityConfig.enable_logging_iteration_details", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 21, "n_typed": 20, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 3, "n_attrs": 10, "n_properties": 3 }, { "kind": "attr", "name": "vllm.config.observability.DetailedTraceModules", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.config.observability", "names": [ "vllm.config.observability.DetailedTraceModules", "vllm.config.observability.ObservabilityConfig" ], "n_typable": 22, "n_typed": 21, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 3, "n_classes": 1, "n_attrs": 11, "n_properties": 3, "n_type_ignores": 0 }, { "path": "vllm/config/scheduler.py", "symbol_reports": [ { "kind": "class", "name": "vllm.config.scheduler.SchedulerConfig", "methods": [ { "kind": "function", "name": "SchedulerConfig.default_factory", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SchedulerConfig.get_scheduler_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SchedulerConfig.compute_hash", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SchedulerConfig._skip_none_validation", "n_typed": 1, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SchedulerConfig.__post_init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SchedulerConfig.verify_max_model_len", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SchedulerConfig.max_model_len", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SchedulerConfig.is_encoder_decoder", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SchedulerConfig.DEFAULT_MAX_NUM_BATCHED_TOKENS", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SchedulerConfig.DEFAULT_MAX_NUM_SEQS", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SchedulerConfig.runner_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SchedulerConfig.max_num_batched_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SchedulerConfig.max_num_scheduled_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SchedulerConfig.max_num_seqs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SchedulerConfig.max_num_partial_prefills", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SchedulerConfig.max_long_partial_prefills", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SchedulerConfig.long_prefill_token_threshold", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SchedulerConfig.enable_chunked_prefill", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SchedulerConfig.is_multimodal_model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SchedulerConfig.max_num_encoder_input_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SchedulerConfig.encoder_cache_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SchedulerConfig.policy", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SchedulerConfig.disable_chunked_mm_input", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SchedulerConfig.scheduler_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SchedulerConfig.disable_hybrid_kv_cache_manager", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SchedulerConfig.async_scheduling", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SchedulerConfig.stream_interval", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 33, "n_typed": 29, "n_any": 2, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 6, "n_attrs": 21, "n_properties": 0 }, { "kind": "attr", "name": "vllm.config.scheduler.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.scheduler.RunnerType", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.scheduler.SchedulerPolicy", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.config.scheduler", "names": [ "vllm.config.scheduler.RunnerType", "vllm.config.scheduler.SchedulerConfig", "vllm.config.scheduler.SchedulerPolicy", "vllm.config.scheduler.logger" ], "n_typable": 36, "n_typed": 31, "n_any": 2, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 6, "n_classes": 1, "n_attrs": 24, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/config/weight_transfer.py", "symbol_reports": [ { "kind": "class", "name": "vllm.config.weight_transfer.WeightTransferConfig", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "WeightTransferConfig.backend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.config.weight_transfer", "names": [ "vllm.config.weight_transfer.WeightTransferConfig" ], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/config/cache.py", "symbol_reports": [ { "kind": "class", "name": "vllm.config.cache.CacheConfig", "methods": [ { "kind": "function", "name": "CacheConfig.compute_hash", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CacheConfig.metrics_info", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CacheConfig._validate_cache_dtype", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CacheConfig.verify_with_parallel_config", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CacheConfig.block_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CacheConfig.gpu_memory_utilization", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CacheConfig.swap_space", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CacheConfig.cache_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CacheConfig.is_attention_free", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CacheConfig.num_gpu_blocks_override", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CacheConfig.sliding_window", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CacheConfig.enable_prefix_caching", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CacheConfig.prefix_caching_hash_algo", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CacheConfig.cpu_offload_gb", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CacheConfig.cpu_offload_params", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CacheConfig.calculate_kv_scales", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CacheConfig.cpu_kvcache_space_bytes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CacheConfig.mamba_page_size_padded", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CacheConfig.mamba_block_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CacheConfig.mamba_cache_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CacheConfig.mamba_ssm_cache_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CacheConfig.mamba_cache_mode", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CacheConfig.num_gpu_blocks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CacheConfig.num_cpu_blocks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CacheConfig.kv_sharing_fast_prefill", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CacheConfig.kv_cache_memory_bytes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CacheConfig.kv_offloading_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CacheConfig.kv_offloading_backend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 30, "n_typed": 28, "n_any": 1, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 2, "n_attrs": 24, "n_properties": 0 }, { "kind": "attr", "name": "vllm.config.cache.MambaCacheMode", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.cache.BlockSize", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.cache.KVOffloadingBackend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.cache.CacheDType", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.cache.MambaDType", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.cache.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.cache.PrefixCachingHashAlgo", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "type_ignores": [ { "kind": "type", "rules": [ "assignment" ] } ], "name": "vllm.config.cache", "names": [ "vllm.config.cache.BlockSize", "vllm.config.cache.CacheConfig", "vllm.config.cache.CacheDType", "vllm.config.cache.KVOffloadingBackend", "vllm.config.cache.MambaCacheMode", "vllm.config.cache.MambaDType", "vllm.config.cache.PrefixCachingHashAlgo", "vllm.config.cache.logger" ], "n_typable": 37, "n_typed": 34, "n_any": 1, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 2, "n_classes": 1, "n_attrs": 31, "n_properties": 0, "n_type_ignores": 1 }, { "path": "vllm/config/lora.py", "symbol_reports": [ { "kind": "class", "name": "vllm.config.lora.LoRAConfig", "methods": [ { "kind": "function", "name": "LoRAConfig.compute_hash", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LoRAConfig._validate_lora_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LoRAConfig.verify_with_model_config", "n_typed": 0, "n_any": 1, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LoRAConfig.max_lora_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LoRAConfig.max_loras", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LoRAConfig.fully_sharded_loras", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LoRAConfig.max_cpu_loras", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LoRAConfig.lora_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LoRAConfig.default_mm_loras", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LoRAConfig.enable_tower_connector_lora", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LoRAConfig.specialize_active_lora", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 12, "n_typed": 10, "n_any": 1, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 1, "n_attrs": 8, "n_properties": 0 }, { "kind": "attr", "name": "vllm.config.lora.LoRAExtraVocabSize", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.lora.LoRADType", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.lora.MaxLoRARanks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.config.lora.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.config.lora", "names": [ "vllm.config.lora.LoRAConfig", "vllm.config.lora.LoRADType", "vllm.config.lora.LoRAExtraVocabSize", "vllm.config.lora.MaxLoRARanks", "vllm.config.lora.logger" ], "n_typable": 16, "n_typed": 13, "n_any": 1, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 1, "n_classes": 1, "n_attrs": 12, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/config/model_arch.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.config.model_arch.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.config.model_arch.ModelArchitectureConfig", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ModelArchitectureConfig.architectures", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ModelArchitectureConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ModelArchitectureConfig.text_model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ModelArchitectureConfig.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ModelArchitectureConfig.total_num_hidden_layers", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ModelArchitectureConfig.total_num_attention_heads", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ModelArchitectureConfig.head_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ModelArchitectureConfig.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ModelArchitectureConfig.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ModelArchitectureConfig.num_experts", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ModelArchitectureConfig.quantization_config", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ModelArchitectureConfig.is_deepseek_mla", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ModelArchitectureConfig.derived_max_model_len_and_key", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 13, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.config.model_arch", "names": [ "vllm.config.model_arch.ModelArchitectureConfig", "vllm.config.model_arch.logger" ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 1, "n_attrs": 14, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/connections.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.connections.global_http_connection", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.connections.HTTPConnection", "methods": [ { "kind": "function", "name": "HTTPConnection.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HTTPConnection.get_sync_client", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "HTTPConnection.get_async_client", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "HTTPConnection._validate_http_url", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HTTPConnection._headers", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HTTPConnection.get_response", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "HTTPConnection.get_async_response", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "HTTPConnection.get_bytes", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "HTTPConnection.async_get_bytes", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "HTTPConnection.get_text", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "HTTPConnection.async_get_text", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "HTTPConnection.get_json", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "HTTPConnection.async_get_json", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "HTTPConnection.download_file", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "HTTPConnection.async_download_file", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "HTTPConnection.reuse_client", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 50, "n_typed": 46, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 34, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.connections", "names": [ "vllm.connections.HTTPConnection", "vllm.connections.global_http_connection" ], "n_typable": 51, "n_typed": 46, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 34, "n_classes": 1, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/device_allocator/cumem.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.device_allocator.cumem.python_unmap_and_release", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.device_allocator.cumem.init_module", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.device_allocator.cumem.AllocationData", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "AllocationData.handle", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AllocationData.tag", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AllocationData.cpu_backup_tensor", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.device_allocator.cumem.libcudart", "n_typed": 0, "n_any": 1, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.device_allocator.cumem.create_and_map", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.device_allocator.cumem.get_pluggable_allocator", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.device_allocator.cumem.lib_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.device_allocator.cumem.python_create_and_map", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.device_allocator.cumem.HandleType", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.device_allocator.cumem.use_memory_pool_with_allocator", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.device_allocator.cumem.cumem_available", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.device_allocator.cumem.CuMemAllocator", "methods": [ { "kind": "function", "name": "CuMemAllocator.get_instance", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CuMemAllocator.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CuMemAllocator._python_malloc_callback", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CuMemAllocator._python_free_callback", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CuMemAllocator.sleep", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CuMemAllocator.wake_up", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CuMemAllocator.use_memory_pool", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CuMemAllocator.get_current_usage", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CuMemAllocator.instance", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CuMemAllocator.default_tag", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CuMemAllocator.pointer_to_data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CuMemAllocator.current_tag", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CuMemAllocator.allocator_and_pools", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CuMemAllocator.python_malloc_callback", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CuMemAllocator.python_free_callback", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 16, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 5, "n_attrs": 7, "n_properties": 0 }, { "kind": "attr", "name": "vllm.device_allocator.cumem.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.device_allocator.cumem.unmap_and_release", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.device_allocator.cumem", "names": [ "vllm.device_allocator.cumem.AllocationData", "vllm.device_allocator.cumem.CuMemAllocator", "vllm.device_allocator.cumem.HandleType", "vllm.device_allocator.cumem.create_and_map", "vllm.device_allocator.cumem.cumem_available", "vllm.device_allocator.cumem.get_pluggable_allocator", "vllm.device_allocator.cumem.init_module", "vllm.device_allocator.cumem.lib_name", "vllm.device_allocator.cumem.libcudart", "vllm.device_allocator.cumem.logger", "vllm.device_allocator.cumem.python_create_and_map", "vllm.device_allocator.cumem.python_unmap_and_release", "vllm.device_allocator.cumem.unmap_and_release", "vllm.device_allocator.cumem.use_memory_pool_with_allocator" ], "n_typable": 33, "n_typed": 26, "n_any": 1, "n_untyped": 6, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 6, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 5, "n_classes": 2, "n_attrs": 18, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/communication_op.py", "symbol_reports": [ { "kind": "function", "name": "vllm.distributed.communication_op.tensor_model_parallel_gather", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.distributed.communication_op.tensor_model_parallel_all_gather", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.distributed.communication_op.tensor_model_parallel_reduce_scatter", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.distributed.communication_op.tensor_model_parallel_all_reduce", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.distributed.communication_op.broadcast_tensor_dict", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.distributed.communication_op", "names": [ "vllm.distributed.communication_op.broadcast_tensor_dict", "vllm.distributed.communication_op.tensor_model_parallel_all_gather", "vllm.distributed.communication_op.tensor_model_parallel_all_reduce", "vllm.distributed.communication_op.tensor_model_parallel_gather", "vllm.distributed.communication_op.tensor_model_parallel_reduce_scatter" ], "n_typable": 15, "n_typed": 14, "n_any": 0, "n_untyped": 1, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 10, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/device_communicators/all2all.py", "symbol_reports": [ { "kind": "class", "name": "vllm.distributed.device_communicators.all2all.DeepEPHTAll2AllManager", "methods": [ { "kind": "function", "name": "DeepEPHTAll2AllManager.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeepEPHTAll2AllManager._make_all2all_kwargs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeepEPHTAll2AllManager.get_handle", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepEPHTAll2AllManager.set_num_sms", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 8, "n_typed": 2, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.distributed.device_communicators.all2all.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.distributed.device_communicators.all2all.DeepEPAll2AllManagerBase", "methods": [ { "kind": "function", "name": "DeepEPAll2AllManagerBase.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeepEPAll2AllManagerBase.get_handle", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepEPAll2AllManagerBase.dispatch_router_logits", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "DeepEPAll2AllManagerBase.dispatch", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "DeepEPAll2AllManagerBase.combine", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeepEPAll2AllManagerBase.destroy", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DeepEPAll2AllManagerBase.handle_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepEPAll2AllManagerBase.num_sms", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 14, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 14, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.device_communicators.all2all.AgRsAll2AllManager", "methods": [ { "kind": "function", "name": "AgRsAll2AllManager.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AgRsAll2AllManager.dispatch_router_logits", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "AgRsAll2AllManager.dispatch", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "AgRsAll2AllManager.combine", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AgRsAll2AllManager.destroy", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 18, "n_typed": 14, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 13, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.device_communicators.all2all.MoriAll2AllManager", "methods": [ { "kind": "function", "name": "MoriAll2AllManager.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MoriAll2AllManager._make_all2all_kwargs", "n_typed": 10, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "MoriAll2AllManager._make_handle", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MoriAll2AllManager.get_handle", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MoriAll2AllManager.handle_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 10, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 13, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.device_communicators.all2all.NaiveAll2AllManager", "methods": [ { "kind": "function", "name": "NaiveAll2AllManager.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NaiveAll2AllManager.naive_multicast", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "NaiveAll2AllManager.dispatch_router_logits", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "NaiveAll2AllManager.dispatch", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "NaiveAll2AllManager.combine", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NaiveAll2AllManager.destroy", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 22, "n_typed": 18, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 16, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.device_communicators.all2all.FlashInferAllToAllManager", "methods": [ { "kind": "function", "name": "FlashInferAllToAllManager.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FlashInferAllToAllManager.initialize", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "FlashInferAllToAllManager.ensure_alltoall_workspace_initialized", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashInferAllToAllManager.get_handle", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlashInferAllToAllManager.cleanup", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashInferAllToAllManager.rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferAllToAllManager.world_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferAllToAllManager.initialized", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferAllToAllManager.alltoall_info", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 5, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 6, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.device_communicators.all2all.DeepEPLLAll2AllManager", "methods": [ { "kind": "function", "name": "DeepEPLLAll2AllManager.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeepEPLLAll2AllManager._make_all2all_kwargs", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "DeepEPLLAll2AllManager.get_handle", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepEPLLAll2AllManager.max_sms_used", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [ { "kind": "type", "rules": [ "import-not-found" ] }, { "kind": "type", "rules": [ "import-not-found" ] } ], "name": "vllm.distributed.device_communicators.all2all", "names": [ "vllm.distributed.device_communicators.all2all.AgRsAll2AllManager", "vllm.distributed.device_communicators.all2all.DeepEPAll2AllManagerBase", "vllm.distributed.device_communicators.all2all.DeepEPHTAll2AllManager", "vllm.distributed.device_communicators.all2all.DeepEPLLAll2AllManager", "vllm.distributed.device_communicators.all2all.FlashInferAllToAllManager", "vllm.distributed.device_communicators.all2all.MoriAll2AllManager", "vllm.distributed.device_communicators.all2all.NaiveAll2AllManager", "vllm.distributed.device_communicators.all2all.logger" ], "n_typable": 116, "n_typed": 70, "n_any": 0, "n_untyped": 46, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 34, "n_method_overloads": 34, "n_method_params": 74, "n_classes": 7, "n_attrs": 8, "n_properties": 0, "n_type_ignores": 2 }, { "path": "vllm/distributed/device_communicators/all_reduce_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.distributed.device_communicators.all_reduce_utils.gpu_p2p_access_check", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.distributed.device_communicators.all_reduce_utils", "names": [ "vllm.distributed.device_communicators.all_reduce_utils.gpu_p2p_access_check" ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/device_communicators/base_device_communicator.py", "symbol_reports": [ { "kind": "class", "name": "vllm.distributed.device_communicators.base_device_communicator.Cache", "methods": [ { "kind": "function", "name": "Cache.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Cache.get_or_create", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.device_communicators.base_device_communicator.DeviceCommunicatorBase", "methods": [ { "kind": "function", "name": "DeviceCommunicatorBase.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "DeviceCommunicatorBase.all_reduce", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeviceCommunicatorBase.all_gather", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeviceCommunicatorBase.all_gatherv", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DeviceCommunicatorBase.reduce_scatter", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeviceCommunicatorBase.reduce_scatterv", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DeviceCommunicatorBase.gather", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DeviceCommunicatorBase.send", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeviceCommunicatorBase.recv", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DeviceCommunicatorBase.broadcast", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeviceCommunicatorBase.destroy", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeviceCommunicatorBase.prepare_communication_buffer_for_model", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeviceCommunicatorBase.dispatch_router_logits", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "DeviceCommunicatorBase.dispatch", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "DeviceCommunicatorBase.combine", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeviceCommunicatorBase.batch_isend_irecv", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DeviceCommunicatorBase.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeviceCommunicatorBase.cpu_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeviceCommunicatorBase.device_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeviceCommunicatorBase.unique_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeviceCommunicatorBase.is_ep_communicator", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeviceCommunicatorBase.use_all2all", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeviceCommunicatorBase.all2all_backend", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeviceCommunicatorBase.all2all_manager", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeviceCommunicatorBase.rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeviceCommunicatorBase.world_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeviceCommunicatorBase.ranks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeviceCommunicatorBase.global_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeviceCommunicatorBase.global_world_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeviceCommunicatorBase.rank_in_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 70, "n_typed": 54, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 16, "n_method_overloads": 16, "n_method_params": 40, "n_attrs": 14, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.device_communicators.base_device_communicator.All2AllManagerBase", "methods": [ { "kind": "function", "name": "All2AllManagerBase.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "All2AllManagerBase.get_handle", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "All2AllManagerBase.dispatch_router_logits", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "All2AllManagerBase.dispatch", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "All2AllManagerBase.set_num_sms", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "All2AllManagerBase.max_sms_used", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "All2AllManagerBase.combine", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "All2AllManagerBase.destroy", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "All2AllManagerBase.rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "All2AllManagerBase.world_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "All2AllManagerBase.cpu_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "All2AllManagerBase.tcp_store_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "All2AllManagerBase.dp_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "All2AllManagerBase.tp_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "All2AllManagerBase.dp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "All2AllManagerBase.dp_world_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "All2AllManagerBase.internode", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 32, "n_typed": 17, "n_any": 0, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 15, "n_attrs": 9, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.distributed.device_communicators.base_device_communicator", "names": [ "vllm.distributed.device_communicators.base_device_communicator.All2AllManagerBase", "vllm.distributed.device_communicators.base_device_communicator.Cache", "vllm.distributed.device_communicators.base_device_communicator.DeviceCommunicatorBase" ], "n_typable": 106, "n_typed": 71, "n_any": 0, "n_untyped": 35, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 26, "n_method_overloads": 26, "n_method_params": 57, "n_classes": 3, "n_attrs": 23, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/device_communicators/cpu_communicator.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.distributed.device_communicators.cpu_communicator.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.distributed.device_communicators.cpu_communicator.CpuCommunicator", "methods": [ { "kind": "function", "name": "CpuCommunicator.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "CpuCommunicator._all_group_ranks_share_shm_group_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CpuCommunicator.all_reduce", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CpuCommunicator.gather", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "CpuCommunicator.all_gather", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CpuCommunicator.send_tensor_dict", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CpuCommunicator.recv_tensor_dict", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CpuCommunicator.dispatch_router_logits", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "CpuCommunicator.dispatch", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "CpuCommunicator.combine", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CpuCommunicator.dist_module", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CpuCommunicator.all2all_backend", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CpuCommunicator.all2all_manager", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 37, "n_typed": 31, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 24, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.distributed.device_communicators.cpu_communicator", "names": [ "vllm.distributed.device_communicators.cpu_communicator.CpuCommunicator", "vllm.distributed.device_communicators.cpu_communicator.logger" ], "n_typable": 38, "n_typed": 31, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 24, "n_classes": 1, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/device_communicators/cuda_communicator.py", "symbol_reports": [ { "kind": "class", "name": "vllm.distributed.device_communicators.cuda_communicator.CudaCommunicator", "methods": [ { "kind": "function", "name": "CudaCommunicator.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "CudaCommunicator.all_reduce", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CudaCommunicator.reduce_scatter", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CudaCommunicator.reduce_scatterv", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "CudaCommunicator.send", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CudaCommunicator.recv", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "CudaCommunicator.broadcast", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CudaCommunicator.destroy", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CudaCommunicator.all_gatherv", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "CudaCommunicator.dispatch_router_logits", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "CudaCommunicator.dispatch", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "CudaCommunicator.combine", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CudaCommunicator.batch_isend_irecv", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CudaCommunicator.use_custom_allreduce", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CudaCommunicator.use_torch_symm_mem", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CudaCommunicator.use_flashinfer_allreduce", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CudaCommunicator.pynccl_comm", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CudaCommunicator.ca_comm", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CudaCommunicator.qr_comm", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CudaCommunicator.symm_mem_comm", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CudaCommunicator.fi_ar_comm", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CudaCommunicator.all2all_manager", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 57, "n_typed": 45, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 35, "n_attrs": 9, "n_properties": 0 }, { "kind": "attr", "name": "vllm.distributed.device_communicators.cuda_communicator.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.distributed.device_communicators.cuda_communicator", "names": [ "vllm.distributed.device_communicators.cuda_communicator.CudaCommunicator", "vllm.distributed.device_communicators.cuda_communicator.logger" ], "n_typable": 58, "n_typed": 45, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 35, "n_classes": 1, "n_attrs": 10, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/device_communicators/cuda_wrapper.py", "symbol_reports": [ { "kind": "class", "name": "vllm.distributed.device_communicators.cuda_wrapper.Function", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Function.name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Function.restype", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Function.argtypes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.device_communicators.cuda_wrapper.CudaRTLibrary", "methods": [ { "kind": "function", "name": "CudaRTLibrary.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CudaRTLibrary.CUDART_CHECK", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CudaRTLibrary.cudaGetErrorString", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CudaRTLibrary.cudaSetDevice", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CudaRTLibrary.cudaDeviceSynchronize", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CudaRTLibrary.cudaDeviceReset", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CudaRTLibrary.cudaMalloc", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CudaRTLibrary.cudaFree", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CudaRTLibrary.cudaMemset", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "CudaRTLibrary.cudaMemcpy", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "CudaRTLibrary.cudaIpcGetMemHandle", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CudaRTLibrary.cudaIpcOpenMemHandle", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CudaRTLibrary.exported_functions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CudaRTLibrary.cuda_to_hip_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CudaRTLibrary.path_to_library_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CudaRTLibrary.path_to_dict_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CudaRTLibrary.lib", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CudaRTLibrary.funcs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 31, "n_typed": 27, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 14, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.device_communicators.cuda_wrapper.cudaIpcMemHandle_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "cudaIpcMemHandle_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.distributed.device_communicators.cuda_wrapper.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.distributed.device_communicators.cuda_wrapper", "names": [ "vllm.distributed.device_communicators.cuda_wrapper.CudaRTLibrary", "vllm.distributed.device_communicators.cuda_wrapper.Function", "vllm.distributed.device_communicators.cuda_wrapper.cudaIpcMemHandle_t", "vllm.distributed.device_communicators.cuda_wrapper.logger" ], "n_typable": 32, "n_typed": 27, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 14, "n_classes": 3, "n_attrs": 11, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/device_communicators/custom_all_reduce.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.distributed.device_communicators.custom_all_reduce.custom_ar", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.distributed.device_communicators.custom_all_reduce.is_weak_contiguous", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.distributed.device_communicators.custom_all_reduce.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.distributed.device_communicators.custom_all_reduce.CustomAllreduce", "methods": [ { "kind": "function", "name": "CustomAllreduce.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "CustomAllreduce.capture", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CustomAllreduce.register_graph_buffers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CustomAllreduce.should_custom_ar", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CustomAllreduce.all_reduce", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "CustomAllreduce.custom_all_reduce", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CustomAllreduce.close", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CustomAllreduce.__del__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CustomAllreduce.create_shared_buffer", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "CustomAllreduce.free_shared_buffer", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CustomAllreduce._SUPPORTED_WORLD_SIZES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CustomAllreduce.disabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CustomAllreduce.group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CustomAllreduce.rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CustomAllreduce.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CustomAllreduce.meta_ptrs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CustomAllreduce.buffer_ptrs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CustomAllreduce.rank_data", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CustomAllreduce.max_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CustomAllreduce.world_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CustomAllreduce.fully_connected", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 35, "n_typed": 17, "n_any": 0, "n_untyped": 18, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 15, "n_attrs": 11, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.distributed.device_communicators.custom_all_reduce", "names": [ "vllm.distributed.device_communicators.custom_all_reduce.CustomAllreduce", "vllm.distributed.device_communicators.custom_all_reduce.custom_ar", "vllm.distributed.device_communicators.custom_all_reduce.is_weak_contiguous", "vllm.distributed.device_communicators.custom_all_reduce.logger" ], "n_typable": 38, "n_typed": 18, "n_any": 0, "n_untyped": 20, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 15, "n_classes": 1, "n_attrs": 13, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/device_communicators/flashinfer_all_reduce.py", "symbol_reports": [ { "kind": "function", "name": "vllm.distributed.device_communicators.flashinfer_all_reduce.get_fi_ar_workspace", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.distributed.device_communicators.flashinfer_all_reduce.fi_ar_available", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.distributed.device_communicators.flashinfer_all_reduce.get_fi_ar_quant_workspace", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.distributed.device_communicators.flashinfer_all_reduce.initialize_fi_ar_quant_workspace", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.distributed.device_communicators.flashinfer_all_reduce.initialize_fi_ar_workspace", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.distributed.device_communicators.flashinfer_all_reduce.destroy_fi_ar_workspace", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "class", "name": "vllm.distributed.device_communicators.flashinfer_all_reduce.FlashInferAllReduce", "methods": [ { "kind": "function", "name": "FlashInferAllReduce.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FlashInferAllReduce._ensure_workspace", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FlashInferAllReduce.should_use_fi_ar", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlashInferAllReduce.all_reduce", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlashInferAllReduce.destroy", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashInferAllReduce.disabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferAllReduce.group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferAllReduce.world_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferAllReduce.rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferAllReduce.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferAllReduce.max_workspace_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferAllReduce.max_num_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 9, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 6, "n_attrs": 7, "n_properties": 0 }, { "kind": "attr", "name": "vllm.distributed.device_communicators.flashinfer_all_reduce.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [ { "kind": "type", "rules": [ "no-redef" ] } ], "name": "vllm.distributed.device_communicators.flashinfer_all_reduce", "names": [ "vllm.distributed.device_communicators.flashinfer_all_reduce.FlashInferAllReduce", "vllm.distributed.device_communicators.flashinfer_all_reduce.destroy_fi_ar_workspace", "vllm.distributed.device_communicators.flashinfer_all_reduce.fi_ar_available", "vllm.distributed.device_communicators.flashinfer_all_reduce.get_fi_ar_quant_workspace", "vllm.distributed.device_communicators.flashinfer_all_reduce.get_fi_ar_workspace", "vllm.distributed.device_communicators.flashinfer_all_reduce.initialize_fi_ar_quant_workspace", "vllm.distributed.device_communicators.flashinfer_all_reduce.initialize_fi_ar_workspace", "vllm.distributed.device_communicators.flashinfer_all_reduce.logger" ], "n_typable": 36, "n_typed": 23, "n_any": 0, "n_untyped": 13, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 12, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 6, "n_classes": 1, "n_attrs": 9, "n_properties": 0, "n_type_ignores": 1 }, { "path": "vllm/distributed/device_communicators/mnnvl_compat.py", "symbol_reports": [ { "kind": "class", "name": "vllm.distributed.device_communicators.mnnvl_compat.CustomCommunicator", "methods": [ { "kind": "function", "name": "CustomCommunicator.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CustomCommunicator.Get_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CustomCommunicator.Get_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CustomCommunicator.allgather", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CustomCommunicator.bcast", "n_typed": 1, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CustomCommunicator.barrier", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CustomCommunicator.Split", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 13, "n_typed": 8, "n_any": 2, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 6, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.distributed.device_communicators.mnnvl_compat.CommBackend", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.distributed.device_communicators.mnnvl_compat", "names": [ "vllm.distributed.device_communicators.mnnvl_compat.CommBackend", "vllm.distributed.device_communicators.mnnvl_compat.CustomCommunicator" ], "n_typable": 13, "n_typed": 8, "n_any": 2, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 6, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/device_communicators/pynccl.py", "symbol_reports": [ { "kind": "function", "name": "vllm.distributed.device_communicators.pynccl.register_nccl_symmetric_ops", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.distributed.device_communicators.pynccl.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.distributed.device_communicators.pynccl.PyNcclCommunicator", "methods": [ { "kind": "function", "name": "PyNcclCommunicator.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "PyNcclCommunicator.all_reduce", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "PyNcclCommunicator.all_gather", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "PyNcclCommunicator.all_gatherv", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "PyNcclCommunicator.reduce_scatter", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "PyNcclCommunicator.reduce_scatterv", "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "PyNcclCommunicator.send", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "PyNcclCommunicator.recv", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "PyNcclCommunicator.broadcast", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "PyNcclCommunicator.group_start", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PyNcclCommunicator.group_end", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PyNcclCommunicator.register_comm_window", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PyNcclCommunicator.register_comm_window_raw", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PyNcclCommunicator.deregister_comm_window", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PyNcclCommunicator.batch_isend_irecv", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PyNcclCommunicator.group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PyNcclCommunicator.available", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PyNcclCommunicator.disabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PyNcclCommunicator.nccl_version", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PyNcclCommunicator.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PyNcclCommunicator.rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PyNcclCommunicator.world_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PyNcclCommunicator.nccl", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PyNcclCommunicator.unique_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PyNcclCommunicator.comm", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 63, "n_typed": 30, "n_any": 0, "n_untyped": 33, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 38, "n_attrs": 10, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.distributed.device_communicators.pynccl", "names": [ "vllm.distributed.device_communicators.pynccl.PyNcclCommunicator", "vllm.distributed.device_communicators.pynccl.logger", "vllm.distributed.device_communicators.pynccl.register_nccl_symmetric_ops" ], "n_typable": 66, "n_typed": 30, "n_any": 0, "n_untyped": 36, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 38, "n_classes": 1, "n_attrs": 11, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/device_communicators/pynccl_allocator.py", "symbol_reports": [ { "kind": "function", "name": "vllm.distributed.device_communicators.pynccl_allocator.is_symmetric_memory_enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.distributed.device_communicators.pynccl_allocator.is_symmetric_memory_tensor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.distributed.device_communicators.pynccl_allocator.compile_nccl_allocator", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "class", "name": "vllm.distributed.device_communicators.pynccl_allocator.nccl_symm_mem_context", "methods": [ { "kind": "function", "name": "nccl_symm_mem_context.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "nccl_symm_mem_context.__enter__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "nccl_symm_mem_context.__exit__", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "nccl_symm_mem_context.disabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "nccl_symm_mem_context.pynccl_comm", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "nccl_symm_mem_context.is_graph_capture", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "nccl_symm_mem_context.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 3, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 5, "n_attrs": 4, "n_properties": 0 }, { "kind": "function", "name": "vllm.distributed.device_communicators.pynccl_allocator.get_nccl_mem_pool", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.distributed.device_communicators.pynccl_allocator.set_graph_pool_id", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.distributed.device_communicators.pynccl_allocator.nccl_allocator_source", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.distributed.device_communicators.pynccl_allocator.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.distributed.device_communicators.pynccl_allocator", "names": [ "vllm.distributed.device_communicators.pynccl_allocator.compile_nccl_allocator", "vllm.distributed.device_communicators.pynccl_allocator.get_nccl_mem_pool", "vllm.distributed.device_communicators.pynccl_allocator.is_symmetric_memory_enabled", "vllm.distributed.device_communicators.pynccl_allocator.is_symmetric_memory_tensor", "vllm.distributed.device_communicators.pynccl_allocator.logger", "vllm.distributed.device_communicators.pynccl_allocator.nccl_allocator_source", "vllm.distributed.device_communicators.pynccl_allocator.nccl_symm_mem_context", "vllm.distributed.device_communicators.pynccl_allocator.set_graph_pool_id" ], "n_typable": 20, "n_typed": 5, "n_any": 1, "n_untyped": 14, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 2, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 5, "n_classes": 1, "n_attrs": 6, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/device_communicators/pynccl_wrapper.py", "symbol_reports": [ { "kind": "class", "name": "vllm.distributed.device_communicators.pynccl_wrapper.ncclRedOpTypeEnum", "methods": [ { "kind": "function", "name": "ncclRedOpTypeEnum.from_torch", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ncclRedOpTypeEnum.ncclSum", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ncclRedOpTypeEnum.ncclProd", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ncclRedOpTypeEnum.ncclMax", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ncclRedOpTypeEnum.ncclMin", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ncclRedOpTypeEnum.ncclAvg", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ncclRedOpTypeEnum.ncclNumOps", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.device_communicators.pynccl_wrapper.ncclDataTypeEnum", "methods": [ { "kind": "function", "name": "ncclDataTypeEnum.from_torch", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ncclDataTypeEnum.ncclInt8", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ncclDataTypeEnum.ncclChar", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ncclDataTypeEnum.ncclUint8", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ncclDataTypeEnum.ncclInt32", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ncclDataTypeEnum.ncclInt", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ncclDataTypeEnum.ncclUint32", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ncclDataTypeEnum.ncclInt64", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ncclDataTypeEnum.ncclUint64", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ncclDataTypeEnum.ncclFloat16", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ncclDataTypeEnum.ncclHalf", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ncclDataTypeEnum.ncclFloat32", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ncclDataTypeEnum.ncclFloat", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ncclDataTypeEnum.ncclFloat64", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ncclDataTypeEnum.ncclDouble", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ncclDataTypeEnum.ncclBfloat16", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ncclDataTypeEnum.ncclFloat8e4m3", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ncclDataTypeEnum.ncclNumTypes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 17, "n_properties": 0 }, { "kind": "attr", "name": "vllm.distributed.device_communicators.pynccl_wrapper.ncclComm_t", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.distributed.device_communicators.pynccl_wrapper.NCCLLibrary", "methods": [ { "kind": "function", "name": "NCCLLibrary.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NCCLLibrary.ncclGetErrorString", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NCCLLibrary.NCCL_CHECK", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NCCLLibrary.ncclGetRawVersion", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NCCLLibrary.ncclGetVersion", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NCCLLibrary.ncclGetUniqueId", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NCCLLibrary.unique_id_from_bytes", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NCCLLibrary.ncclCommInitRank", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "NCCLLibrary.ncclAllReduce", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "NCCLLibrary.ncclReduce", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "NCCLLibrary.ncclReduceScatter", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "NCCLLibrary.ncclAllGather", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "NCCLLibrary.ncclSend", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "NCCLLibrary.ncclRecv", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "NCCLLibrary.ncclBroadcast", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "NCCLLibrary.ncclCommDestroy", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NCCLLibrary.ncclGroupStart", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NCCLLibrary.ncclGroupEnd", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NCCLLibrary.ncclCommWindowRegister", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "NCCLLibrary.ncclCommWindowDeregister", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "NCCLLibrary.exported_functions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NCCLLibrary.path_to_library_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NCCLLibrary.path_to_dict_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NCCLLibrary.lib", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 85, "n_typed": 82, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 20, "n_method_overloads": 20, "n_method_params": 61, "n_attrs": 4, "n_properties": 0 }, { "kind": "attr", "name": "vllm.distributed.device_communicators.pynccl_wrapper.buffer_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.distributed.device_communicators.pynccl_wrapper.cudaStream_t", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.distributed.device_communicators.pynccl_wrapper.ncclUniqueId", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ncclUniqueId._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.distributed.device_communicators.pynccl_wrapper", "names": [ "vllm.distributed.device_communicators.pynccl_wrapper.NCCLLibrary", "vllm.distributed.device_communicators.pynccl_wrapper.buffer_type", "vllm.distributed.device_communicators.pynccl_wrapper.cudaStream_t", "vllm.distributed.device_communicators.pynccl_wrapper.ncclComm_t", "vllm.distributed.device_communicators.pynccl_wrapper.ncclDataTypeEnum", "vllm.distributed.device_communicators.pynccl_wrapper.ncclRedOpTypeEnum", "vllm.distributed.device_communicators.pynccl_wrapper.ncclUniqueId" ], "n_typable": 89, "n_typed": 86, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 22, "n_method_overloads": 22, "n_method_params": 63, "n_classes": 4, "n_attrs": 31, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/device_communicators/quick_all_reduce.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.distributed.device_communicators.quick_all_reduce.quick_ar", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.distributed.device_communicators.quick_all_reduce.MB", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.distributed.device_communicators.quick_all_reduce.QuickAllReduce", "methods": [ { "kind": "function", "name": "QuickAllReduce.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "QuickAllReduce.init_quick_all_reduce", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "QuickAllReduce._rocm_arch_available", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "QuickAllReduce.create_shared_buffer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "QuickAllReduce.should_quick_allreduce", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "QuickAllReduce.quick_all_reduce", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "QuickAllReduce.close", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "QuickAllReduce.__del__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "QuickAllReduce._SUPPORTED_WORLD_SIZES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "QuickAllReduce._SUPPORTED_DTYPES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "QuickAllReduce._QR_MIN_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "QuickAllReduce.disabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuickAllReduce.group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuickAllReduce.rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuickAllReduce.world_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuickAllReduce.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuickAllReduce.fully_connected", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 6, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 5, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.device_communicators.quick_all_reduce.QuickReduceRegime", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "QuickReduceRegime.FP", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "QuickReduceRegime.INT8", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "QuickReduceRegime.INT6", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "QuickReduceRegime.INT4", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "QuickReduceRegime.NONE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 5, "n_properties": 0 }, { "kind": "function", "name": "vllm.distributed.device_communicators.quick_all_reduce.is_weak_contiguous", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.distributed.device_communicators.quick_all_reduce.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.distributed.device_communicators.quick_all_reduce", "names": [ "vllm.distributed.device_communicators.quick_all_reduce.MB", "vllm.distributed.device_communicators.quick_all_reduce.QuickAllReduce", "vllm.distributed.device_communicators.quick_all_reduce.QuickReduceRegime", "vllm.distributed.device_communicators.quick_all_reduce.is_weak_contiguous", "vllm.distributed.device_communicators.quick_all_reduce.logger", "vllm.distributed.device_communicators.quick_all_reduce.quick_ar" ], "n_typable": 22, "n_typed": 7, "n_any": 0, "n_untyped": 15, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 5, "n_classes": 2, "n_attrs": 17, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/device_communicators/ray_communicator.py", "symbol_reports": [ { "kind": "class", "name": "vllm.distributed.device_communicators.ray_communicator.RayPPCommunicator", "methods": [ { "kind": "function", "name": "RayPPCommunicator.__init__", "n_typed": 5, "n_any": 1, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "RayPPCommunicator._build_actor_rank_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RayPPCommunicator.initialize", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RayPPCommunicator.get_actor_handles", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RayPPCommunicator.get_rank", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RayPPCommunicator.get_self_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RayPPCommunicator.get_world_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RayPPCommunicator.send", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "RayPPCommunicator.recv", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "RayPPCommunicator.allgather", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "RayPPCommunicator.allreduce", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "RayPPCommunicator.reducescatter", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "RayPPCommunicator.destroy", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RayPPCommunicator.get_transport_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RayPPCommunicator.generate_communicator_id", "n_typed": 0, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "RayPPCommunicator.recv_stream", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "RayPPCommunicator.send_stream", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "RayPPCommunicator._comm", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 40, "n_typed": 31, "n_any": 2, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 22, "n_attrs": 1, "n_properties": 2 }, { "kind": "attr", "name": "vllm.distributed.device_communicators.ray_communicator.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.distributed.device_communicators.ray_communicator", "names": [ "vllm.distributed.device_communicators.ray_communicator.RayPPCommunicator", "vllm.distributed.device_communicators.ray_communicator.logger" ], "n_typable": 41, "n_typed": 31, "n_any": 2, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 22, "n_classes": 1, "n_attrs": 2, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/distributed/device_communicators/shm_broadcast.py", "symbol_reports": [ { "kind": "function", "name": "vllm.distributed.device_communicators.shm_broadcast.to_bytes_big", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.distributed.device_communicators.shm_broadcast.memory_fence", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "class", "name": "vllm.distributed.device_communicators.shm_broadcast.SpinSleepTimer", "methods": [ { "kind": "function", "name": "SpinSleepTimer.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SpinSleepTimer.record_activity", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SpinSleepTimer.spin", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SpinSleepTimer.last_activity", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpinSleepTimer.busy_loop_s", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpinSleepTimer.wait_sleep_s", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 2, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 2, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.device_communicators.shm_broadcast.ShmRingBuffer", "methods": [ { "kind": "function", "name": "ShmRingBuffer.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ShmRingBuffer.handle", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ShmRingBuffer.__reduce__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ShmRingBuffer.__del__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ShmRingBuffer.get_data", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ShmRingBuffer.get_metadata", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ShmRingBuffer.n_reader", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ShmRingBuffer.metadata_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ShmRingBuffer.max_chunk_bytes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ShmRingBuffer.max_chunks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ShmRingBuffer.total_bytes_of_buffer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ShmRingBuffer.data_offset", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ShmRingBuffer.metadata_offset", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ShmRingBuffer.is_creator", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ShmRingBuffer.shared_memory", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 6, "n_any": 0, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 6, "n_attrs": 9, "n_properties": 0 }, { "kind": "function", "name": "vllm.distributed.device_communicators.shm_broadcast.long_wait_time_msg", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.distributed.device_communicators.shm_broadcast.Handle", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Handle.local_reader_ranks", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Handle.buffer_handle", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Handle.local_subscribe_addr", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Handle.remote_subscribe_addr", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Handle.remote_addr_ipv6", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.device_communicators.shm_broadcast.MessageQueue", "methods": [ { "kind": "function", "name": "MessageQueue.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "MessageQueue.export_handle", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MessageQueue.create_from_handle", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MessageQueue.wait_until_ready", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MessageQueue.acquire_write", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MessageQueue.acquire_read", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MessageQueue.enqueue", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MessageQueue.dequeue", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MessageQueue.recv", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MessageQueue.broadcast_object", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MessageQueue.create_from_process_group_single_reader", "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MessageQueue.create_from_process_group", "n_typed": 4, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MessageQueue.n_local_reader", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MessageQueue.n_remote_reader", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MessageQueue.local_reader_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MessageQueue.handle", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MessageQueue.buffer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MessageQueue.local_socket", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MessageQueue.current_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MessageQueue.remote_socket", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 51, "n_typed": 25, "n_any": 1, "n_untyped": 25, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 31, "n_attrs": 8, "n_properties": 0 }, { "kind": "attr", "name": "vllm.distributed.device_communicators.shm_broadcast.from_bytes_big", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.distributed.device_communicators.shm_broadcast.SpinTimer", "methods": [ { "kind": "function", "name": "SpinTimer.record_activity", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SpinTimer.spin", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.distributed.device_communicators.shm_broadcast.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.distributed.device_communicators.shm_broadcast", "names": [ "vllm.distributed.device_communicators.shm_broadcast.Handle", "vllm.distributed.device_communicators.shm_broadcast.MessageQueue", "vllm.distributed.device_communicators.shm_broadcast.ShmRingBuffer", "vllm.distributed.device_communicators.shm_broadcast.SpinSleepTimer", "vllm.distributed.device_communicators.shm_broadcast.SpinTimer", "vllm.distributed.device_communicators.shm_broadcast.from_bytes_big", "vllm.distributed.device_communicators.shm_broadcast.logger", "vllm.distributed.device_communicators.shm_broadcast.long_wait_time_msg", "vllm.distributed.device_communicators.shm_broadcast.memory_fence", "vllm.distributed.device_communicators.shm_broadcast.to_bytes_big" ], "n_typable": 90, "n_typed": 38, "n_any": 1, "n_untyped": 51, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 3, "n_methods": 23, "n_method_overloads": 23, "n_method_params": 39, "n_classes": 5, "n_attrs": 27, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/device_communicators/shm_object_storage.py", "symbol_reports": [ { "kind": "class", "name": "vllm.distributed.device_communicators.shm_object_storage.SingleWriterShmObjectStorage", "methods": [ { "kind": "function", "name": "SingleWriterShmObjectStorage.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "SingleWriterShmObjectStorage.clear", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SingleWriterShmObjectStorage.copy_to_buffer", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "SingleWriterShmObjectStorage.increment_writer_flag", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SingleWriterShmObjectStorage.increment_reader_flag", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SingleWriterShmObjectStorage.free_unused", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SingleWriterShmObjectStorage.is_cached", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SingleWriterShmObjectStorage.get_cached", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SingleWriterShmObjectStorage.put", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SingleWriterShmObjectStorage.get", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SingleWriterShmObjectStorage.touch", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SingleWriterShmObjectStorage.close", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SingleWriterShmObjectStorage.handle", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SingleWriterShmObjectStorage.create_from_handle", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SingleWriterShmObjectStorage.default_is_free_check", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SingleWriterShmObjectStorage.max_object_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SingleWriterShmObjectStorage.n_readers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SingleWriterShmObjectStorage.serde_class", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SingleWriterShmObjectStorage.ser_de", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SingleWriterShmObjectStorage.ring_buffer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SingleWriterShmObjectStorage.is_writer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SingleWriterShmObjectStorage.flag_bytes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SingleWriterShmObjectStorage.key_index", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SingleWriterShmObjectStorage.id_index", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SingleWriterShmObjectStorage.writer_flag", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 49, "n_typed": 38, "n_any": 2, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 24, "n_attrs": 10, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.device_communicators.shm_object_storage.ShmObjectStorageHandle", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ShmObjectStorageHandle.max_object_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ShmObjectStorageHandle.n_readers", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ShmObjectStorageHandle.ring_buffer_handle", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ShmObjectStorageHandle.serde_class", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ShmObjectStorageHandle.reader_lock", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.device_communicators.shm_object_storage.ObjectSerde", "methods": [ { "kind": "function", "name": "ObjectSerde.serialize", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ObjectSerde.deserialize", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 2, "n_any": 2, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.device_communicators.shm_object_storage.MsgpackSerde", "methods": [ { "kind": "function", "name": "MsgpackSerde.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MsgpackSerde.serialize", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MsgpackSerde.deserialize", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MsgpackSerde.encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MsgpackSerde.tensor_decoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MsgpackSerde.mm_decoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 2, "n_any": 2, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 2, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.device_communicators.shm_object_storage.SingleWriterShmRingBuffer", "methods": [ { "kind": "function", "name": "SingleWriterShmRingBuffer.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SingleWriterShmRingBuffer.handle", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SingleWriterShmRingBuffer.clear", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SingleWriterShmRingBuffer.close", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SingleWriterShmRingBuffer.__del__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SingleWriterShmRingBuffer.int2byte", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SingleWriterShmRingBuffer.byte2int", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SingleWriterShmRingBuffer.allocate_buf", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SingleWriterShmRingBuffer.access_buf", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SingleWriterShmRingBuffer.free_buf", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SingleWriterShmRingBuffer.data_buffer_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SingleWriterShmRingBuffer.is_writer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SingleWriterShmRingBuffer.ID_NBYTES", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SingleWriterShmRingBuffer.ID_MAX", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SingleWriterShmRingBuffer.SIZE_NBYTES", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SingleWriterShmRingBuffer.MD_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SingleWriterShmRingBuffer.monotonic_id_end", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SingleWriterShmRingBuffer.monotonic_id_start", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SingleWriterShmRingBuffer.data_buffer_start", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SingleWriterShmRingBuffer.data_buffer_end", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SingleWriterShmRingBuffer.metadata", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SingleWriterShmRingBuffer.shared_memory", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 31, "n_typed": 16, "n_any": 0, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 9, "n_attrs": 12, "n_properties": 0 }, { "kind": "attr", "name": "vllm.distributed.device_communicators.shm_object_storage.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.distributed.device_communicators.shm_object_storage", "names": [ "vllm.distributed.device_communicators.shm_object_storage.MsgpackSerde", "vllm.distributed.device_communicators.shm_object_storage.ObjectSerde", "vllm.distributed.device_communicators.shm_object_storage.ShmObjectStorageHandle", "vllm.distributed.device_communicators.shm_object_storage.SingleWriterShmObjectStorage", "vllm.distributed.device_communicators.shm_object_storage.SingleWriterShmRingBuffer", "vllm.distributed.device_communicators.shm_object_storage.logger" ], "n_typable": 93, "n_typed": 58, "n_any": 6, "n_untyped": 29, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 30, "n_method_overloads": 30, "n_method_params": 37, "n_classes": 5, "n_attrs": 31, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/device_communicators/symm_mem.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.distributed.device_communicators.symm_mem.symm_mem_available", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.distributed.device_communicators.symm_mem.SymmMemCommunicator", "methods": [ { "kind": "function", "name": "SymmMemCommunicator.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "SymmMemCommunicator.should_use_symm_mem", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SymmMemCommunicator.all_reduce", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SymmMemCommunicator._WORLD_SIZES_MULTIMEM", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SymmMemCommunicator.disabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SymmMemCommunicator.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SymmMemCommunicator.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SymmMemCommunicator.group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SymmMemCommunicator.world_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SymmMemCommunicator.device_capability", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SymmMemCommunicator.force_multimem", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SymmMemCommunicator.max_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SymmMemCommunicator.buffer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 8, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 10, "n_properties": 0 }, { "kind": "attr", "name": "vllm.distributed.device_communicators.symm_mem.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.distributed.device_communicators.symm_mem", "names": [ "vllm.distributed.device_communicators.symm_mem.SymmMemCommunicator", "vllm.distributed.device_communicators.symm_mem.logger", "vllm.distributed.device_communicators.symm_mem.symm_mem_available" ], "n_typable": 20, "n_typed": 8, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_classes": 1, "n_attrs": 12, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/device_communicators/xpu_communicator.py", "symbol_reports": [ { "kind": "class", "name": "vllm.distributed.device_communicators.xpu_communicator.XpuCommunicator", "methods": [ { "kind": "function", "name": "XpuCommunicator.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "XpuCommunicator.all_reduce", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "XpuCommunicator.reduce_scatter", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "XpuCommunicator.reduce_scatterv", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "XpuCommunicator.all_gatherv", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "XpuCommunicator.gather", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "XpuCommunicator.broadcast", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "XpuCommunicator.dispatch_router_logits", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "XpuCommunicator.dispatch", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "XpuCommunicator.combine", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "XpuCommunicator.all2all_manager", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 40, "n_typed": 34, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 29, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.distributed.device_communicators.xpu_communicator.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.distributed.device_communicators.xpu_communicator", "names": [ "vllm.distributed.device_communicators.xpu_communicator.XpuCommunicator", "vllm.distributed.device_communicators.xpu_communicator.logger" ], "n_typable": 41, "n_typed": 34, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 29, "n_classes": 1, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/ec_transfer/ec_transfer_state.py", "symbol_reports": [ { "kind": "function", "name": "vllm.distributed.ec_transfer.ec_transfer_state.has_ec_transfer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.distributed.ec_transfer.ec_transfer_state.ensure_ec_transfer_initialized", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.distributed.ec_transfer.ec_transfer_state.get_ec_transfer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "type_ignores": [], "name": "vllm.distributed.ec_transfer.ec_transfer_state", "names": [ "vllm.distributed.ec_transfer.ec_transfer_state.ensure_ec_transfer_initialized", "vllm.distributed.ec_transfer.ec_transfer_state.get_ec_transfer", "vllm.distributed.ec_transfer.ec_transfer_state.has_ec_transfer" ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 1, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/ec_transfer/ec_connector/base.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.distributed.ec_transfer.ec_connector.base.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.distributed.ec_transfer.ec_connector.base.ECConnectorRole", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ECConnectorRole.SCHEDULER", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ECConnectorRole.WORKER", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.ec_transfer.ec_connector.base.ECConnectorMetadata", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.ec_transfer.ec_connector.base.ECConnectorBase", "methods": [ { "kind": "function", "name": "ECConnectorBase.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ECConnectorBase.bind_connector_metadata", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ECConnectorBase.clear_connector_metadata", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ECConnectorBase._get_connector_metadata", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ECConnectorBase.register_caches", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ECConnectorBase.start_load_caches", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ECConnectorBase.save_caches", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ECConnectorBase.get_finished", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ECConnectorBase.has_cache_item", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ECConnectorBase.update_state_after_alloc", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ECConnectorBase.build_connector_meta", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ECConnectorBase.update_connector_output", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ECConnectorBase.request_finished", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "ECConnectorBase.role", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ECConnectorBase.is_producer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ECConnectorBase.is_consumer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [], "n_typable": 32, "n_typed": 26, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 16, "n_attrs": 0, "n_properties": 3 } ], "type_ignores": [], "name": "vllm.distributed.ec_transfer.ec_connector.base", "names": [ "vllm.distributed.ec_transfer.ec_connector.base.ECConnectorBase", "vllm.distributed.ec_transfer.ec_connector.base.ECConnectorMetadata", "vllm.distributed.ec_transfer.ec_connector.base.ECConnectorRole", "vllm.distributed.ec_transfer.ec_connector.base.logger" ], "n_typable": 33, "n_typed": 26, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 16, "n_classes": 3, "n_attrs": 3, "n_properties": 3, "n_type_ignores": 0 }, { "path": "vllm/distributed/ec_transfer/ec_connector/example_connector.py", "symbol_reports": [ { "kind": "class", "name": "vllm.distributed.ec_transfer.ec_connector.example_connector.ECExampleConnectorMetadata", "methods": [ { "kind": "function", "name": "ECExampleConnectorMetadata.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ECExampleConnectorMetadata.add_mm_data", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ECExampleConnectorMetadata.mm_datas", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 3, "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.distributed.ec_transfer.ec_connector.example_connector.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.distributed.ec_transfer.ec_connector.example_connector.ECExampleConnector", "methods": [ { "kind": "function", "name": "ECExampleConnector.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ECExampleConnector.start_load_caches", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ECExampleConnector.save_caches", "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ECExampleConnector.has_cache_item", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ECExampleConnector.update_state_after_alloc", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ECExampleConnector.build_connector_meta", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ECExampleConnector._found_match_for_mm_data", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ECExampleConnector._generate_foldername_debug", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ECExampleConnector._generate_filename_debug", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 24, "n_typed": 17, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 15, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.ec_transfer.ec_connector.example_connector.MMMeta", "methods": [ { "kind": "function", "name": "MMMeta.make_meta", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MMMeta.mm_hash", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MMMeta.num_token", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 3, "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.distributed.ec_transfer.ec_connector.example_connector", "names": [ "vllm.distributed.ec_transfer.ec_connector.example_connector.ECExampleConnector", "vllm.distributed.ec_transfer.ec_connector.example_connector.ECExampleConnectorMetadata", "vllm.distributed.ec_transfer.ec_connector.example_connector.MMMeta", "vllm.distributed.ec_transfer.ec_connector.example_connector.logger" ], "n_typable": 31, "n_typed": 19, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 18, "n_classes": 3, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/ec_transfer/ec_connector/factory.py", "symbol_reports": [ { "kind": "class", "name": "vllm.distributed.ec_transfer.ec_connector.factory.ECConnectorFactory", "methods": [ { "kind": "function", "name": "ECConnectorFactory.register_connector", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ECConnectorFactory.create_connector", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ECConnectorFactory.get_connector_class", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ECConnectorFactory._registry", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 10, "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.distributed.ec_transfer.ec_connector.factory.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.distributed.ec_transfer.ec_connector.factory", "names": [ "vllm.distributed.ec_transfer.ec_connector.factory.ECConnectorFactory", "vllm.distributed.ec_transfer.ec_connector.factory.logger" ], "n_typable": 11, "n_typed": 10, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_classes": 1, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/elastic_ep/elastic_execute.py", "symbol_reports": [ { "kind": "function", "name": "vllm.distributed.elastic_ep.elastic_execute.broadcast_expert_mapping", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "attr", "name": "vllm.distributed.elastic_ep.elastic_execute.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.distributed.elastic_ep.elastic_execute.batch_transfer_weights", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "class", "name": "vllm.distributed.elastic_ep.elastic_execute.ElasticEPScalingExecutor", "methods": [ { "kind": "function", "name": "ElasticEPScalingExecutor.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ElasticEPScalingExecutor.execute", "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ElasticEPScalingExecutor.create_standby_groups", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ElasticEPScalingExecutor.transfer_weights", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ElasticEPScalingExecutor.broadcast_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ElasticEPScalingExecutor.switch_and_remove", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ElasticEPScalingExecutor.switch_and_prepare", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ElasticEPScalingExecutor.perform_eplb_reshuffle", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ElasticEPScalingExecutor.receive_weights", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ElasticEPScalingExecutor.receive_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ElasticEPScalingExecutor.prepare_new_worker", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "ElasticEPScalingExecutor.worker", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "ElasticEPScalingExecutor.worker_ref", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ElasticEPScalingExecutor.reconfig_request", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 14, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 8, "n_attrs": 2, "n_properties": 1 } ], "type_ignores": [], "name": "vllm.distributed.elastic_ep.elastic_execute", "names": [ "vllm.distributed.elastic_ep.elastic_execute.ElasticEPScalingExecutor", "vllm.distributed.elastic_ep.elastic_execute.batch_transfer_weights", "vllm.distributed.elastic_ep.elastic_execute.broadcast_expert_mapping", "vllm.distributed.elastic_ep.elastic_execute.logger" ], "n_typable": 36, "n_typed": 27, "n_any": 0, "n_untyped": 9, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 11, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 8, "n_classes": 1, "n_attrs": 3, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/distributed/elastic_ep/elastic_state.py", "symbol_reports": [ { "kind": "class", "name": "vllm.distributed.elastic_ep.elastic_state.ElasticEPScalingState", "methods": [ { "kind": "function", "name": "ElasticEPScalingState.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "ElasticEPScalingState.progress", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ElasticEPScalingState._execute_tcp_store_barrier", "n_typed": 0, "n_any": 0, "n_untyped": 6, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "ElasticEPScalingState._staged_barrier", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ElasticEPScalingState._progress_existing_engine", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ElasticEPScalingState._progress_new_engine", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ElasticEPScalingState._progress_remaining_engine", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ElasticEPScalingState._progress_removing_engine", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ElasticEPScalingState.handle_notification", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ElasticEPScalingState.is_complete", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ElasticEPScalingState._create_standby_groups", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ElasticEPScalingState._transfer_weights", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ElasticEPScalingState._transfer_expert_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ElasticEPScalingState._sync_kv_cache_memory_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ElasticEPScalingState._switch_and_prepare", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ElasticEPScalingState._eplb_reshuffle", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ElasticEPScalingState._eplb_reshuffle_before_scale_down", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ElasticEPScalingState._switch_and_remove", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ElasticEPScalingState._update_parallel_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "ElasticEPScalingState.model_executor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ElasticEPScalingState.engine_core", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "ElasticEPScalingState.model_executor_ref", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ElasticEPScalingState.engine_core_ref", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ElasticEPScalingState.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ElasticEPScalingState.old_dp_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ElasticEPScalingState.old_dp_store", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ElasticEPScalingState.new_parallel_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ElasticEPScalingState.new_dp_group", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ElasticEPScalingState.new_dp_store", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ElasticEPScalingState.worker_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ElasticEPScalingState.scale_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ElasticEPScalingState.reconfig_request", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ElasticEPScalingState.state", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 48, "n_typed": 21, "n_any": 0, "n_untyped": 27, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 19, "n_method_overloads": 19, "n_method_params": 15, "n_attrs": 12, "n_properties": 2 }, { "kind": "class", "name": "vllm.distributed.elastic_ep.elastic_state.ScaleUpExistingEngineState", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ScaleUpExistingEngineState.WAIT_NEW_CORE_ENGINES_INIT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ScaleUpExistingEngineState.CREATE_STANDBY_GROUPS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ScaleUpExistingEngineState.TRANSFER_EXPERT_MAPPING", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ScaleUpExistingEngineState.WAIT_NEW_CORE_ENGINES_WEIGHTS_INIT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ScaleUpExistingEngineState.TRANSFER_WEIGHTS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ScaleUpExistingEngineState.SYNC_KV_CACHE_MEMORY_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ScaleUpExistingEngineState.SWITCH_AND_PREPARE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ScaleUpExistingEngineState.EPLB_RESHUFFLE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ScaleUpExistingEngineState.COMPLETE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 9, "n_properties": 0 }, { "kind": "attr", "name": "vllm.distributed.elastic_ep.elastic_state.WorkerType", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.distributed.elastic_ep.elastic_state.ScaleDownRemainingEngineState", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ScaleDownRemainingEngineState.PREPARE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ScaleDownRemainingEngineState.EPLB_RESHUFFLE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ScaleDownRemainingEngineState.SWITCH_AND_PREPARE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ScaleDownRemainingEngineState.COMPLETE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.elastic_ep.elastic_state.ScaleDownRemovingEngineState", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ScaleDownRemovingEngineState.PREPARE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ScaleDownRemovingEngineState.EPLB_RESHUFFLE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ScaleDownRemovingEngineState.COMPLETE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.elastic_ep.elastic_state.ScaleUpNewEngineState", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ScaleUpNewEngineState.PREPARE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ScaleUpNewEngineState.EPLB_RESHUFFLE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ScaleUpNewEngineState.COMPLETE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.distributed.elastic_ep.elastic_state.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.distributed.elastic_ep.elastic_state", "names": [ "vllm.distributed.elastic_ep.elastic_state.ElasticEPScalingState", "vllm.distributed.elastic_ep.elastic_state.ScaleDownRemainingEngineState", "vllm.distributed.elastic_ep.elastic_state.ScaleDownRemovingEngineState", "vllm.distributed.elastic_ep.elastic_state.ScaleUpExistingEngineState", "vllm.distributed.elastic_ep.elastic_state.ScaleUpNewEngineState", "vllm.distributed.elastic_ep.elastic_state.WorkerType", "vllm.distributed.elastic_ep.elastic_state.logger" ], "n_typable": 50, "n_typed": 22, "n_any": 0, "n_untyped": 28, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 19, "n_method_overloads": 19, "n_method_params": 15, "n_classes": 5, "n_attrs": 33, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/distributed/elastic_ep/standby_state.py", "symbol_reports": [ { "kind": "function", "name": "vllm.distributed.elastic_ep.standby_state.pop_standby_groups", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.distributed.elastic_ep.standby_state.get_standby_dp_group", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.distributed.elastic_ep.standby_state.create_standby_groups", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "vllm.distributed.elastic_ep.standby_state.get_standby_eplb_group", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.distributed.elastic_ep.standby_state.get_standby_world_group", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.distributed.elastic_ep.standby_state.get_standby_ep_group", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "type_ignores": [], "name": "vllm.distributed.elastic_ep.standby_state", "names": [ "vllm.distributed.elastic_ep.standby_state.create_standby_groups", "vllm.distributed.elastic_ep.standby_state.get_standby_dp_group", "vllm.distributed.elastic_ep.standby_state.get_standby_ep_group", "vllm.distributed.elastic_ep.standby_state.get_standby_eplb_group", "vllm.distributed.elastic_ep.standby_state.get_standby_world_group", "vllm.distributed.elastic_ep.standby_state.pop_standby_groups" ], "n_typable": 14, "n_typed": 14, "n_any": 0, "n_untyped": 0, "n_functions": 6, "n_function_overloads": 6, "n_function_params": 8, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/eplb/async_worker.py", "symbol_reports": [ { "kind": "function", "name": "vllm.distributed.eplb.async_worker.start_async_worker", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.distributed.eplb.async_worker.transfer_run_periodically", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.distributed.eplb.async_worker.run_rebalance_experts", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.distributed.eplb.async_worker.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.distributed.eplb.async_worker", "names": [ "vllm.distributed.eplb.async_worker.logger", "vllm.distributed.eplb.async_worker.run_rebalance_experts", "vllm.distributed.eplb.async_worker.start_async_worker", "vllm.distributed.eplb.async_worker.transfer_run_periodically" ], "n_typable": 13, "n_typed": 12, "n_any": 0, "n_untyped": 1, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 9, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/eplb/eplb_state.py", "symbol_reports": [ { "kind": "class", "name": "vllm.distributed.eplb.eplb_state.EplbStats", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "EplbStats.global_expert_load_window", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EplbStats.num_replicas", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EplbStats.num_groups", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EplbStats.num_nodes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EplbStats.num_gpus", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.eplb.eplb_state.EplbLayerState", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "EplbLayerState.expert_load_view", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EplbLayerState.logical_to_physical_map", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EplbLayerState.logical_replica_count", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.eplb.eplb_state.EplbModelState", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "EplbModelState.physical_to_logical_map", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EplbModelState.logical_to_physical_map", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EplbModelState.logical_replica_count", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EplbModelState.expert_load_pass", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EplbModelState.expert_load_window", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EplbModelState.model_name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EplbModelState.model", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EplbModelState.expert_buffer", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EplbModelState.buffer_lock", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EplbModelState.buffer_ready_event", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EplbModelState.buffer_consumed_event", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EplbModelState.window_ready_event", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EplbModelState.ep_buffer_ready", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EplbModelState.layer_to_transfer", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EplbModelState.rebalanced", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EplbModelState.pending_global_ready_check", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EplbModelState.eplb_stats", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EplbModelState.is_unchanged", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EplbModelState.is_received_locally", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EplbModelState.recv_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EplbModelState.cuda_device_index", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EplbModelState.new_physical_to_logical_map", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EplbModelState.new_logical_to_physical_map", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EplbModelState.new_logical_replica_count", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 24, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.eplb.eplb_state.EplbState", "methods": [ { "kind": "function", "name": "EplbState.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EplbState.build_initial_global_physical_to_logical_map", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EplbState.validate_ep_configuration", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EplbState.add_model", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EplbState.step", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "EplbState.rearrange", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EplbState.start_async_loop", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EplbState._update_layer_mapping_from_new", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EplbState._all_ranks_buffer_ready", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EplbState.move_to_workspace", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "EplbState.post_eplb", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EplbState._allreduce_list", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EplbState._sync_load_pass", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EplbState.from_mapping", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EplbState.parallel_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EplbState.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EplbState.model_states", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EplbState.policy", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EplbState.expert_load_window_step", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EplbState.expert_load_window_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EplbState.expert_rearrangement_step", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EplbState.expert_rearrangement_step_interval", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EplbState.is_async", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EplbState.rearrange_event", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EplbState.async_worker", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EplbState.cuda_device_index", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EplbState.num_valid_physical_experts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 56, "n_typed": 48, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 29, "n_attrs": 13, "n_properties": 0 }, { "kind": "attr", "name": "vllm.distributed.eplb.eplb_state.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.distributed.eplb.eplb_state", "names": [ "vllm.distributed.eplb.eplb_state.EplbLayerState", "vllm.distributed.eplb.eplb_state.EplbModelState", "vllm.distributed.eplb.eplb_state.EplbState", "vllm.distributed.eplb.eplb_state.EplbStats", "vllm.distributed.eplb.eplb_state.logger" ], "n_typable": 57, "n_typed": 48, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 29, "n_classes": 4, "n_attrs": 46, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/eplb/eplb_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.distributed.eplb.eplb_utils.override_envs_for_eplb", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.distributed.eplb.eplb_utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.distributed.eplb.eplb_utils", "names": [ "vllm.distributed.eplb.eplb_utils.logger", "vllm.distributed.eplb.eplb_utils.override_envs_for_eplb" ], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/eplb/policy/__init__.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.distributed.eplb.policy.EPLB_POLICIES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.distributed.eplb.policy", "names": [ "vllm.distributed.eplb.policy.EPLB_POLICIES" ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/eplb/policy/default.py", "symbol_reports": [ { "kind": "class", "name": "vllm.distributed.eplb.policy.default.DefaultEplbPolicy", "methods": [ { "kind": "function", "name": "DefaultEplbPolicy.balanced_packing", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DefaultEplbPolicy.replicate_experts", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DefaultEplbPolicy.rebalance_experts_hierarchical", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "DefaultEplbPolicy.preserve_intragpu_slots", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "DefaultEplbPolicy.rebalance_experts", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [], "n_typable": 24, "n_typed": 24, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 19, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.distributed.eplb.policy.default", "names": [ "vllm.distributed.eplb.policy.default.DefaultEplbPolicy" ], "n_typable": 24, "n_typed": 24, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 19, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/eplb/policy/abstract.py", "symbol_reports": [ { "kind": "class", "name": "vllm.distributed.eplb.policy.abstract.AbstractEplbPolicy", "methods": [ { "kind": "function", "name": "AbstractEplbPolicy.rebalance_experts", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 6, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.distributed.eplb.policy.abstract", "names": [ "vllm.distributed.eplb.policy.abstract.AbstractEplbPolicy" ], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 6, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/eplb/rebalance_execute.py", "symbol_reports": [ { "kind": "function", "name": "vllm.distributed.eplb.rebalance_execute.transfer_layer", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "vllm.distributed.eplb.rebalance_execute.move_from_buffer", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "class", "name": "vllm.distributed.eplb.rebalance_execute.RecvMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "RecvMetadata.recv_primary_mask", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RecvMetadata.recv_count", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RecvMetadata.recv_expert_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RecvMetadata.recv_dst_rows", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.distributed.eplb.rebalance_execute", "names": [ "vllm.distributed.eplb.rebalance_execute.RecvMetadata", "vllm.distributed.eplb.rebalance_execute.move_from_buffer", "vllm.distributed.eplb.rebalance_execute.transfer_layer" ], "n_typable": 17, "n_typed": 17, "n_any": 0, "n_untyped": 0, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 15, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 1, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/kv_events.py", "symbol_reports": [ { "kind": "class", "name": "vllm.distributed.kv_events.NullEventPublisher", "methods": [ { "kind": "function", "name": "NullEventPublisher.publish", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NullEventPublisher.shutdown", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_events.KVEventBatch", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "KVEventBatch.events", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.distributed.kv_events.MEDIUM_GPU", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.distributed.kv_events.BlockRemoved", "methods": [ { "kind": "function", "name": "BlockRemoved.__hash__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BlockRemoved.block_hashes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BlockRemoved.medium", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_events.AllBlocksCleared", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_events.EventPublisher", "methods": [ { "kind": "function", "name": "EventPublisher.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EventPublisher.publish", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EventPublisher.shutdown", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_events.KVCacheEvent", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_events.KVEventAggregator", "methods": [ { "kind": "function", "name": "KVEventAggregator.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVEventAggregator.add_events", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVEventAggregator.get_common_events", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KVEventAggregator.get_all_events", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KVEventAggregator.clear_events", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KVEventAggregator.increment_workers", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVEventAggregator.reset_workers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KVEventAggregator.get_number_of_workers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KVEventAggregator.__repr__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_events.EventPublisherFactory", "methods": [ { "kind": "function", "name": "EventPublisherFactory.register_publisher", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EventPublisherFactory.create", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EventPublisherFactory._registry", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_events.KVConnectorKVEvents", "methods": [ { "kind": "function", "name": "KVConnectorKVEvents.add_events", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVConnectorKVEvents.aggregate", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KVConnectorKVEvents.increment_workers", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVConnectorKVEvents.get_all_events", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KVConnectorKVEvents.get_number_of_workers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KVConnectorKVEvents.clear_events", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KVConnectorKVEvents.merge", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 10, "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_events.EventBatch", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "EventBatch.ts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EventBatch.events", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EventBatch.data_parallel_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.distributed.kv_events.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.distributed.kv_events.BlockStored", "methods": [ { "kind": "function", "name": "BlockStored.__hash__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BlockStored.block_hashes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BlockStored.parent_block_hash", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BlockStored.token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BlockStored.block_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BlockStored.lora_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BlockStored.medium", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BlockStored.lora_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BlockStored.extra_keys", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 9, "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_events.ZmqEventPublisher", "methods": [ { "kind": "function", "name": "ZmqEventPublisher.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "ZmqEventPublisher.publish", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ZmqEventPublisher.shutdown", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ZmqEventPublisher._socket_setup", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ZmqEventPublisher._publisher_thread", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ZmqEventPublisher._service_replay", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ZmqEventPublisher.offset_endpoint_port", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ZmqEventPublisher.SHUTDOWN_TIMEOUT", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ZmqEventPublisher.END_SEQ", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 18, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 10, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [ { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] } ], "name": "vllm.distributed.kv_events", "names": [ "vllm.distributed.kv_events.AllBlocksCleared", "vllm.distributed.kv_events.BlockRemoved", "vllm.distributed.kv_events.BlockStored", "vllm.distributed.kv_events.EventBatch", "vllm.distributed.kv_events.EventPublisher", "vllm.distributed.kv_events.EventPublisherFactory", "vllm.distributed.kv_events.KVCacheEvent", "vllm.distributed.kv_events.KVConnectorKVEvents", "vllm.distributed.kv_events.KVEventAggregator", "vllm.distributed.kv_events.KVEventBatch", "vllm.distributed.kv_events.MEDIUM_GPU", "vllm.distributed.kv_events.NullEventPublisher", "vllm.distributed.kv_events.ZmqEventPublisher", "vllm.distributed.kv_events.logger" ], "n_typable": 73, "n_typed": 70, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 32, "n_method_overloads": 32, "n_method_params": 23, "n_classes": 12, "n_attrs": 19, "n_properties": 0, "n_type_ignores": 6 }, { "path": "vllm/distributed/kv_transfer/kv_transfer_state.py", "symbol_reports": [ { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_transfer_state.is_v1_kv_transfer_group", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_transfer_state.ensure_kv_transfer_shutdown", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_transfer_state.ensure_kv_transfer_initialized", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_transfer_state.get_kv_transfer_group", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_transfer_state.has_kv_transfer_group", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "type_ignores": [], "name": "vllm.distributed.kv_transfer.kv_transfer_state", "names": [ "vllm.distributed.kv_transfer.kv_transfer_state.ensure_kv_transfer_initialized", "vllm.distributed.kv_transfer.kv_transfer_state.ensure_kv_transfer_shutdown", "vllm.distributed.kv_transfer.kv_transfer_state.get_kv_transfer_group", "vllm.distributed.kv_transfer.kv_transfer_state.has_kv_transfer_group", "vllm.distributed.kv_transfer.kv_transfer_state.is_v1_kv_transfer_group" ], "n_typable": 8, "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 3, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/kv_transfer/kv_connector/v1/base.py", "symbol_reports": [ { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.base.KVConnectorBase_V1", "methods": [ { "kind": "function", "name": "KVConnectorBase_V1.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "KVConnectorBase_V1.bind_connector_metadata", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVConnectorBase_V1.clear_connector_metadata", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KVConnectorBase_V1._get_connector_metadata", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KVConnectorBase_V1.has_connector_metadata", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KVConnectorBase_V1.register_kv_caches", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVConnectorBase_V1.register_cross_layers_kv_cache", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "KVConnectorBase_V1.set_host_xfer_buffer_ops", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVConnectorBase_V1.handle_preemptions", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVConnectorBase_V1.start_load_kv", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "KVConnectorBase_V1.wait_for_layer_load", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVConnectorBase_V1.save_kv_layer", "n_typed": 4, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "KVConnectorBase_V1.wait_for_save", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KVConnectorBase_V1.get_finished", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVConnectorBase_V1.get_block_ids_with_load_errors", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KVConnectorBase_V1.shutdown", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KVConnectorBase_V1.get_kv_connector_stats", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KVConnectorBase_V1.get_kv_connector_kv_cache_events", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KVConnectorBase_V1.get_handshake_metadata", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KVConnectorBase_V1.get_num_new_matched_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "KVConnectorBase_V1.update_state_after_alloc", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "KVConnectorBase_V1.build_connector_meta", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVConnectorBase_V1.update_connector_output", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVConnectorBase_V1.request_finished", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "KVConnectorBase_V1.take_events", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KVConnectorBase_V1.get_required_kvcache_layout", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVConnectorBase_V1.requires_piecewise_for_cudagraph", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVConnectorBase_V1.get_finished_count", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KVConnectorBase_V1.build_kv_connector_stats", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVConnectorBase_V1.set_xfer_handshake_metadata", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVConnectorBase_V1.build_prom_metrics", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "KVConnectorBase_V1.reset_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "KVConnectorBase_V1.prefer_cross_layer_blocks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "KVConnectorBase_V1.role", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [], "n_typable": 68, "n_typed": 57, "n_any": 2, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 32, "n_method_overloads": 32, "n_method_params": 34, "n_attrs": 0, "n_properties": 2 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.base.KVConnectorRole", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "KVConnectorRole.SCHEDULER", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "KVConnectorRole.WORKER", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_connector.v1.base.supports_hma", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.base.SupportsHMA", "methods": [ { "kind": "function", "name": "SupportsHMA.request_finished_all_groups", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.base.KVConnectorMetadata", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.base.KVConnectorHandshakeMetadata", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.base.CopyBlocksOp", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.base.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.distributed.kv_transfer.kv_connector.v1.base", "names": [ "vllm.distributed.kv_transfer.kv_connector.v1.base.CopyBlocksOp", "vllm.distributed.kv_transfer.kv_connector.v1.base.KVConnectorBase_V1", "vllm.distributed.kv_transfer.kv_connector.v1.base.KVConnectorHandshakeMetadata", "vllm.distributed.kv_transfer.kv_connector.v1.base.KVConnectorMetadata", "vllm.distributed.kv_transfer.kv_connector.v1.base.KVConnectorRole", "vllm.distributed.kv_transfer.kv_connector.v1.base.SupportsHMA", "vllm.distributed.kv_transfer.kv_connector.v1.base.logger", "vllm.distributed.kv_transfer.kv_connector.v1.base.supports_hma" ], "n_typable": 75, "n_typed": 62, "n_any": 3, "n_untyped": 10, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 33, "n_method_overloads": 33, "n_method_params": 36, "n_classes": 5, "n_attrs": 4, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/distributed/kv_transfer/kv_connector/factory.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.factory.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.factory.KVConnectorFactory", "methods": [ { "kind": "function", "name": "KVConnectorFactory.register_connector", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "KVConnectorFactory.create_connector", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "KVConnectorFactory.get_connector_class_by_name", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVConnectorFactory._get_connector_class_with_compat", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVConnectorFactory.get_connector_class", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "KVConnectorFactory._registry", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 15, "n_typed": 15, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.distributed.kv_transfer.kv_connector.factory", "names": [ "vllm.distributed.kv_transfer.kv_connector.factory.KVConnectorFactory", "vllm.distributed.kv_transfer.kv_connector.factory.logger" ], "n_typable": 16, "n_typed": 15, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_classes": 1, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/kv_transfer/kv_connector/utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_connector.utils.kv_postprocess_layout_on_receive", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.utils.TpKVTopology", "methods": [ { "kind": "function", "name": "TpKVTopology.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TpKVTopology.tp_ratio", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TpKVTopology.block_size_ratio", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TpKVTopology.tp_ratio_from_engine_id", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TpKVTopology.block_size_ratio_from_engine_id", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TpKVTopology.is_kv_replicated", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TpKVTopology.replicates_kv_cache", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TpKVTopology.get_target_remote_ranks", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TpKVTopology.get_target_remote_ranks_from_engine_id", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "TpKVTopology.is_kv_layout_blocks_first", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "TpKVTopology.split_k_and_v", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "TpKVTopology.tp_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "TpKVTopology.block_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "TpKVTopology.cross_layers_blocks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "TpKVTopology.block_size_position", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "TpKVTopology.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TpKVTopology.remote_tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TpKVTopology.is_mla", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TpKVTopology.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TpKVTopology.attn_backend", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TpKVTopology.engine_id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TpKVTopology.remote_block_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TpKVTopology.tensor_shape", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 23, "n_typed": 22, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 8, "n_attrs": 8, "n_properties": 6 }, { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_connector.utils.kv_postprocess_blksize_and_layout_on_receive", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_connector.utils.get_kv_connector_cache_layout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.utils.KVOutputAggregator", "methods": [ { "kind": "function", "name": "KVOutputAggregator.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVOutputAggregator.from_connector", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "KVOutputAggregator.aggregate", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 8, "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.utils.EngineId", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_connector.utils.get_current_attn_backend", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_connector.utils.copy_kv_blocks", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_connector.utils.kv_postprocess_blksize_on_receive", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_connector.utils.yield_req_data", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.distributed.kv_transfer.kv_connector.utils", "names": [ "vllm.distributed.kv_transfer.kv_connector.utils.EngineId", "vllm.distributed.kv_transfer.kv_connector.utils.KVOutputAggregator", "vllm.distributed.kv_transfer.kv_connector.utils.TpKVTopology", "vllm.distributed.kv_transfer.kv_connector.utils.copy_kv_blocks", "vllm.distributed.kv_transfer.kv_connector.utils.get_current_attn_backend", "vllm.distributed.kv_transfer.kv_connector.utils.get_kv_connector_cache_layout", "vllm.distributed.kv_transfer.kv_connector.utils.kv_postprocess_blksize_and_layout_on_receive", "vllm.distributed.kv_transfer.kv_connector.utils.kv_postprocess_blksize_on_receive", "vllm.distributed.kv_transfer.kv_connector.utils.kv_postprocess_layout_on_receive", "vllm.distributed.kv_transfer.kv_connector.utils.logger", "vllm.distributed.kv_transfer.kv_connector.utils.yield_req_data" ], "n_typable": 54, "n_typed": 36, "n_any": 0, "n_untyped": 18, "n_functions": 7, "n_function_overloads": 7, "n_function_params": 15, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 13, "n_classes": 2, "n_attrs": 10, "n_properties": 6, "n_type_ignores": 0 }, { "path": "vllm/distributed/kv_transfer/kv_connector/v1/decode_bench_connector.py", "symbol_reports": [ { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.decode_bench_connector.DecodeBenchConnector", "methods": [ { "kind": "function", "name": "DecodeBenchConnector.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DecodeBenchConnector.register_kv_caches", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DecodeBenchConnector.start_load_kv", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DecodeBenchConnector.wait_for_layer_load", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DecodeBenchConnector.save_kv_layer", "n_typed": 4, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "DecodeBenchConnector.wait_for_save", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DecodeBenchConnector.get_num_new_matched_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DecodeBenchConnector.update_state_after_alloc", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DecodeBenchConnector.build_connector_meta", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DecodeBenchConnector.request_finished", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DecodeBenchConnector.connector_scheduler", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DecodeBenchConnector.connector_worker", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 31, "n_typed": 25, "n_any": 2, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 19, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.decode_bench_connector.DecodeBenchConnectorScheduler", "methods": [ { "kind": "function", "name": "DecodeBenchConnectorScheduler.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DecodeBenchConnectorScheduler.get_num_new_matched_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DecodeBenchConnectorScheduler.update_state_after_alloc", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DecodeBenchConnectorScheduler.build_connector_meta", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DecodeBenchConnectorScheduler.request_finished", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DecodeBenchConnectorScheduler.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DecodeBenchConnectorScheduler.block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 10, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 8, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.decode_bench_connector.DecodeBenchConnectorMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "DecodeBenchConnectorMetadata.reqs_to_fill", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.decode_bench_connector.DecodeBenchConnectorWorker", "methods": [ { "kind": "function", "name": "DecodeBenchConnectorWorker.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DecodeBenchConnectorWorker.register_kv_caches", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DecodeBenchConnectorWorker.start_fill_kv", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DecodeBenchConnectorWorker._fill_blocks", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DecodeBenchConnectorWorker.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DecodeBenchConnectorWorker.block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DecodeBenchConnectorWorker.fill_mean", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DecodeBenchConnectorWorker.fill_std", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DecodeBenchConnectorWorker.kv_caches", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DecodeBenchConnectorWorker.group_to_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 16, "n_typed": 8, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 6, "n_attrs": 6, "n_properties": 0 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.decode_bench_connector.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.distributed.kv_transfer.kv_connector.v1.decode_bench_connector", "names": [ "vllm.distributed.kv_transfer.kv_connector.v1.decode_bench_connector.DecodeBenchConnector", "vllm.distributed.kv_transfer.kv_connector.v1.decode_bench_connector.DecodeBenchConnectorMetadata", "vllm.distributed.kv_transfer.kv_connector.v1.decode_bench_connector.DecodeBenchConnectorScheduler", "vllm.distributed.kv_transfer.kv_connector.v1.decode_bench_connector.DecodeBenchConnectorWorker", "vllm.distributed.kv_transfer.kv_connector.v1.decode_bench_connector.logger" ], "n_typable": 63, "n_typed": 43, "n_any": 2, "n_untyped": 18, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 19, "n_method_overloads": 19, "n_method_params": 33, "n_classes": 4, "n_attrs": 12, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/kv_transfer/kv_connector/v1/example_connector.py", "symbol_reports": [ { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.example_connector.ExampleConnector", "methods": [ { "kind": "function", "name": "ExampleConnector.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ExampleConnector.start_load_kv", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ExampleConnector.wait_for_layer_load", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ExampleConnector.save_kv_layer", "n_typed": 4, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ExampleConnector.wait_for_save", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ExampleConnector.get_num_new_matched_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ExampleConnector.update_state_after_alloc", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ExampleConnector.build_connector_meta", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ExampleConnector._found_match_for_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ExampleConnector._found_match_for_prompt", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ExampleConnector._generate_foldername_debug", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ExampleConnector._generate_filename_debug", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 37, "n_typed": 31, "n_any": 2, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 25, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.example_connector.ReqMeta", "methods": [ { "kind": "function", "name": "ReqMeta.make_meta", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ReqMeta.token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ReqMeta.slot_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ReqMeta.is_store", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ReqMeta.mm_hashes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 5, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.example_connector.ExampleConnectorMetadata", "methods": [ { "kind": "function", "name": "ExampleConnectorMetadata.add_request", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ExampleConnectorMetadata.requests", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 5, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_connector.v1.example_connector.align_to_block_size", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.example_connector.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.distributed.kv_transfer.kv_connector.v1.example_connector", "names": [ "vllm.distributed.kv_transfer.kv_connector.v1.example_connector.ExampleConnector", "vllm.distributed.kv_transfer.kv_connector.v1.example_connector.ExampleConnectorMetadata", "vllm.distributed.kv_transfer.kv_connector.v1.example_connector.ReqMeta", "vllm.distributed.kv_transfer.kv_connector.v1.example_connector.align_to_block_size", "vllm.distributed.kv_transfer.kv_connector.v1.example_connector.logger" ], "n_typable": 53, "n_typed": 45, "n_any": 2, "n_untyped": 6, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 35, "n_classes": 3, "n_attrs": 6, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/kv_transfer/kv_connector/v1/example_hidden_states_connector.py", "symbol_reports": [ { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.example_hidden_states_connector.ReqMeta", "methods": [ { "kind": "function", "name": "ReqMeta.make_meta", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ReqMeta.req_id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ReqMeta.filename", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ReqMeta.token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ReqMeta.slot_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ReqMeta.new_req", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 6, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.example_hidden_states_connector.ExampleHiddenStatesConnector", "methods": [ { "kind": "function", "name": "ExampleHiddenStatesConnector.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ExampleHiddenStatesConnector.start_load_kv", "n_typed": 1, "n_any": 1, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ExampleHiddenStatesConnector.wait_for_layer_load", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ExampleHiddenStatesConnector.wait_for_save", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ExampleHiddenStatesConnector.register_kv_caches", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ExampleHiddenStatesConnector.save_kv_layer", "n_typed": 4, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ExampleHiddenStatesConnector.get_num_new_matched_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ExampleHiddenStatesConnector.update_state_after_alloc", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ExampleHiddenStatesConnector.build_connector_meta", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ExampleHiddenStatesConnector.request_finished", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ExampleHiddenStatesConnector.get_required_kvcache_layout", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "ExampleHiddenStatesConnector.prefer_cross_layer_blocks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "ExampleHiddenStatesConnector.cache_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ExampleHiddenStatesConnector.num_hidden_states", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 34, "n_typed": 26, "n_any": 2, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 20, "n_attrs": 2, "n_properties": 1 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.example_hidden_states_connector.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.example_hidden_states_connector.ExampleHiddenStatesConnectorMetadata", "methods": [ { "kind": "function", "name": "ExampleHiddenStatesConnectorMetadata.add_request", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ExampleHiddenStatesConnectorMetadata.requests", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 6, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_connector.v1.example_hidden_states_connector.extract_from_kv_cache", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [], "name": "vllm.distributed.kv_transfer.kv_connector.v1.example_hidden_states_connector", "names": [ "vllm.distributed.kv_transfer.kv_connector.v1.example_hidden_states_connector.ExampleHiddenStatesConnector", "vllm.distributed.kv_transfer.kv_connector.v1.example_hidden_states_connector.ExampleHiddenStatesConnectorMetadata", "vllm.distributed.kv_transfer.kv_connector.v1.example_hidden_states_connector.ReqMeta", "vllm.distributed.kv_transfer.kv_connector.v1.example_hidden_states_connector.extract_from_kv_cache", "vllm.distributed.kv_transfer.kv_connector.v1.example_hidden_states_connector.logger" ], "n_typable": 53, "n_typed": 44, "n_any": 2, "n_untyped": 7, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 3, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 32, "n_classes": 3, "n_attrs": 9, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/distributed/kv_transfer/kv_connector/v1/lmcache_connector.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_connector.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_connector.LMCacheConnectorV1", "methods": [ { "kind": "function", "name": "LMCacheConnectorV1.requires_piecewise_for_cudagraph", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LMCacheConnectorV1.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LMCacheConnectorV1.register_kv_caches", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LMCacheConnectorV1.start_load_kv", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LMCacheConnectorV1.wait_for_layer_load", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LMCacheConnectorV1.save_kv_layer", "n_typed": 4, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "LMCacheConnectorV1.wait_for_save", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LMCacheConnectorV1.get_finished", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LMCacheConnectorV1.get_block_ids_with_load_errors", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LMCacheConnectorV1.get_kv_connector_kv_cache_events", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LMCacheConnectorV1.get_num_new_matched_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LMCacheConnectorV1.update_state_after_alloc", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LMCacheConnectorV1.build_connector_meta", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LMCacheConnectorV1.update_connector_output", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LMCacheConnectorV1.request_finished", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LMCacheConnectorV1.take_events", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 38, "n_typed": 31, "n_any": 2, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 16, "n_method_overloads": 16, "n_method_params": 22, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_connector.LMCacheKVEvents", "methods": [ { "kind": "function", "name": "LMCacheKVEvents.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LMCacheKVEvents.add_events", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LMCacheKVEvents.aggregate", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LMCacheKVEvents.increment_workers", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LMCacheKVEvents.get_all_events", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LMCacheKVEvents.get_number_of_workers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LMCacheKVEvents.clear_events", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LMCacheKVEvents.__repr__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 11, "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_connector", "names": [ "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_connector.LMCacheConnectorV1", "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_connector.LMCacheKVEvents", "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_connector.logger" ], "n_typable": 50, "n_typed": 42, "n_any": 2, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 24, "n_method_overloads": 24, "n_method_params": 25, "n_classes": 2, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/kv_transfer/kv_connector/v1/lmcache_integration/multi_process_adapter.py", "symbol_reports": [ { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.multi_process_adapter.LMCacheMPWorkerAdapter", "methods": [ { "kind": "function", "name": "LMCacheMPWorkerAdapter.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "LMCacheMPWorkerAdapter.register_kv_caches", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LMCacheMPWorkerAdapter.submit_store_request", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LMCacheMPWorkerAdapter.submit_retrieve_request", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LMCacheMPWorkerAdapter.batched_submit_store_requests", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LMCacheMPWorkerAdapter.batched_submit_retrieve_requests", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LMCacheMPWorkerAdapter.get_finished", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LMCacheMPWorkerAdapter.num_blocks_per_chunk", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LMCacheMPWorkerAdapter.shutdown", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LMCacheMPWorkerAdapter._update_and_get_finished_store", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LMCacheMPWorkerAdapter._create_key", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "LMCacheMPWorkerAdapter._create_hash_key", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LMCacheMPWorkerAdapter.mq_client", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LMCacheMPWorkerAdapter.instance_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LMCacheMPWorkerAdapter.kv_caches", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LMCacheMPWorkerAdapter.store_futures", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LMCacheMPWorkerAdapter.retrieve_futures", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LMCacheMPWorkerAdapter.finished_stores", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LMCacheMPWorkerAdapter.previously_finished", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LMCacheMPWorkerAdapter.model_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LMCacheMPWorkerAdapter.world_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LMCacheMPWorkerAdapter.worker_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LMCacheMPWorkerAdapter.blocks_in_chunk", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 49, "n_typed": 36, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 26, "n_attrs": 11, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.multi_process_adapter.LMCacheMPSchedulerAdapter", "methods": [ { "kind": "function", "name": "LMCacheMPSchedulerAdapter.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "LMCacheMPSchedulerAdapter.maybe_submit_lookup_request", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LMCacheMPSchedulerAdapter.check_lookup_result", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LMCacheMPSchedulerAdapter.num_blocks_per_chunk", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LMCacheMPSchedulerAdapter.cleanup_lookup_result", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LMCacheMPSchedulerAdapter.end_session", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LMCacheMPSchedulerAdapter._create_key", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "LMCacheMPSchedulerAdapter._create_hash_key", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LMCacheMPSchedulerAdapter.mq_client", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LMCacheMPSchedulerAdapter.lookup_futures", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LMCacheMPSchedulerAdapter.model_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LMCacheMPSchedulerAdapter.world_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LMCacheMPSchedulerAdapter.worker_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LMCacheMPSchedulerAdapter.chunk_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LMCacheMPSchedulerAdapter.blocks_in_chunk", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 33, "n_typed": 26, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 18, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.multi_process_adapter.LoadStoreOp", "methods": [ { "kind": "function", "name": "LoadStoreOp.__len__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LoadStoreOp.block_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LoadStoreOp.token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LoadStoreOp.block_hashes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LoadStoreOp.start", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LoadStoreOp.end", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 5, "n_properties": 0 }, { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.multi_process_adapter.get_lmcache_chunk_size", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.multi_process_adapter.StoreResult", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.multi_process_adapter.RetrieveResult", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.multi_process_adapter.striding_block_hashes", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.multi_process_adapter.wrap_kv_caches", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.multi_process_adapter.send_lmcache_request", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.multi_process_adapter.LookupResult", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.multi_process_adapter.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.multi_process_adapter", "names": [ "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.multi_process_adapter.LMCacheMPSchedulerAdapter", "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.multi_process_adapter.LMCacheMPWorkerAdapter", "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.multi_process_adapter.LoadStoreOp", "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.multi_process_adapter.LookupResult", "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.multi_process_adapter.RetrieveResult", "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.multi_process_adapter.StoreResult", "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.multi_process_adapter.get_lmcache_chunk_size", "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.multi_process_adapter.logger", "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.multi_process_adapter.send_lmcache_request", "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.multi_process_adapter.striding_block_hashes", "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.multi_process_adapter.wrap_kv_caches" ], "n_typable": 95, "n_typed": 74, "n_any": 0, "n_untyped": 21, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 7, "n_methods": 21, "n_method_overloads": 21, "n_method_params": 44, "n_classes": 3, "n_attrs": 27, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/kv_transfer/kv_connector/v1/lmcache_integration/utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.utils.hex_hash_to_int16", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.utils.create_lmcache_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.utils.mla_enabled", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.utils.ENGINE_NAME", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.utils.apply_mm_hashes_to_token_ids", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.utils.lmcache_get_or_create_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.utils.extract_mm_features", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.utils.is_false", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.utils", "names": [ "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.utils.ENGINE_NAME", "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.utils.apply_mm_hashes_to_token_ids", "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.utils.create_lmcache_metadata", "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.utils.extract_mm_features", "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.utils.hex_hash_to_int16", "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.utils.is_false", "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.utils.lmcache_get_or_create_config", "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.utils.logger", "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.utils.mla_enabled" ], "n_typable": 20, "n_typed": 14, "n_any": 0, "n_untyped": 6, "n_functions": 7, "n_function_overloads": 7, "n_function_params": 12, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/kv_transfer/kv_connector/v1/lmcache_integration/vllm_v1_adapter.py", "symbol_reports": [ { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.vllm_v1_adapter.need_gpu_interm_buffer", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.vllm_v1_adapter.SaveSpec", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "SaveSpec.skip_leading_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SaveSpec.can_save", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.vllm_v1_adapter.extract_request_configs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.vllm_v1_adapter.tmp_disagg_tracker", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.vllm_v1_adapter.ReqMeta", "methods": [ { "kind": "function", "name": "ReqMeta.from_request_tracker", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ReqMeta.req_id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ReqMeta.token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ReqMeta.slot_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ReqMeta.is_last_prefill", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ReqMeta.save_spec", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ReqMeta.load_spec", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ReqMeta.disagg_spec", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ReqMeta.request_configs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 6, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.vllm_v1_adapter.LMCacheConnectorV1Impl", "methods": [ { "kind": "function", "name": "LMCacheConnectorV1Impl.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LMCacheConnectorV1Impl.get_inference_info", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LMCacheConnectorV1Impl.get_inference_version", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LMCacheConnectorV1Impl._init_kv_caches_from_forward_context", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LMCacheConnectorV1Impl.register_kv_caches", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LMCacheConnectorV1Impl.start_load_kv", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LMCacheConnectorV1Impl.wait_for_layer_load", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LMCacheConnectorV1Impl.save_kv_layer", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "LMCacheConnectorV1Impl.wait_for_save", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LMCacheConnectorV1Impl.get_finished", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LMCacheConnectorV1Impl.get_num_new_matched_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LMCacheConnectorV1Impl.update_state_after_alloc", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LMCacheConnectorV1Impl.build_connector_meta", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LMCacheConnectorV1Impl.request_finished", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LMCacheConnectorV1Impl.kv_role", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LMCacheConnectorV1Impl.worker_count", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LMCacheConnectorV1Impl.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LMCacheConnectorV1Impl.async_loading", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LMCacheConnectorV1Impl.layerwise_retrievers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LMCacheConnectorV1Impl.kv_caches", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LMCacheConnectorV1Impl.load_specs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LMCacheConnectorV1Impl.kv_cache_manager", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LMCacheConnectorV1Impl.skip_last_n_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LMCacheConnectorV1Impl.num_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LMCacheConnectorV1Impl.current_layer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LMCacheConnectorV1Impl.force_skip_save", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LMCacheConnectorV1Impl.lookup_client", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LMCacheConnectorV1Impl.lmcache_engine", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LMCacheConnectorV1Impl.api_server", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LMCacheConnectorV1Impl.plugin_launcher", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LMCacheConnectorV1Impl.use_layerwise", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LMCacheConnectorV1Impl.enable_blending", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LMCacheConnectorV1Impl.lookup_server", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LMCacheConnectorV1Impl.offload_server", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LMCacheConnectorV1Impl.blender", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 55, "n_typed": 31, "n_any": 0, "n_untyped": 24, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 20, "n_attrs": 21, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.vllm_v1_adapter.DisaggSpec", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "DisaggSpec.req_id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DisaggSpec.receiver_id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DisaggSpec.receiver_host", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DisaggSpec.receiver_init_port", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DisaggSpec.receiver_alloc_port", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DisaggSpec.is_last_prefill", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DisaggSpec.num_transferred_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.vllm_v1_adapter.RequestTracker", "methods": [ { "kind": "function", "name": "RequestTracker.from_new_request", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "RequestTracker.update", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RequestTracker.req_id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RequestTracker.prompt_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RequestTracker.token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RequestTracker.allocated_block_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RequestTracker.num_saved_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RequestTracker.disagg_spec", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RequestTracker.mm_hashes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RequestTracker.mm_positions", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RequestTracker.request_configs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RequestTracker.is_decode_phase", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RequestTracker.skip_save", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 9, "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 11, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.vllm_v1_adapter.LMCacheConnectorMetadata", "methods": [ { "kind": "function", "name": "LMCacheConnectorMetadata.add_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LMCacheConnectorMetadata.requests", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LMCacheConnectorMetadata.lookup_requests_in_step", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.vllm_v1_adapter.LoadSpec", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "LoadSpec.vllm_cached_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LoadSpec.lmcache_cached_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LoadSpec.can_load", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.vllm_v1_adapter.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.vllm_v1_adapter", "names": [ "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.vllm_v1_adapter.DisaggSpec", "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.vllm_v1_adapter.LMCacheConnectorMetadata", "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.vllm_v1_adapter.LMCacheConnectorV1Impl", "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.vllm_v1_adapter.LoadSpec", "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.vllm_v1_adapter.ReqMeta", "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.vllm_v1_adapter.RequestTracker", "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.vllm_v1_adapter.SaveSpec", "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.vllm_v1_adapter.extract_request_configs", "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.vllm_v1_adapter.logger", "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.vllm_v1_adapter.need_gpu_interm_buffer", "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration.vllm_v1_adapter.tmp_disagg_tracker" ], "n_typable": 79, "n_typed": 53, "n_any": 0, "n_untyped": 26, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 2, "n_methods": 18, "n_method_overloads": 18, "n_method_params": 34, "n_classes": 7, "n_attrs": 56, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/kv_transfer/kv_connector/v1/lmcache_mp_connector.py", "symbol_reports": [ { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_mp_connector.create_scheduler_adapter", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_mp_connector.LMCacheMPRequestState", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "LMCacheMPRequestState.PREFETCHING", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LMCacheMPRequestState.WAITING_FOR_LOAD", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LMCacheMPRequestState.READY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_mp_connector.reformat_block_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_mp_connector.LMCacheMPRequestMetadata", "methods": [ { "kind": "function", "name": "LMCacheMPRequestMetadata.GetStoreMetadata", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LMCacheMPRequestMetadata.GetRetrieveMetadata", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LMCacheMPRequestMetadata.request_id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LMCacheMPRequestMetadata.direction", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LMCacheMPRequestMetadata.op", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 8, "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_mp_connector.LMCacheMPRequestTracker", "methods": [ { "kind": "function", "name": "LMCacheMPRequestTracker.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LMCacheMPRequestTracker.needs_retrieve", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LMCacheMPRequestTracker.is_ready_for_retrieving", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LMCacheMPRequestTracker.increase_num_scheduled_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LMCacheMPRequestTracker.increase_num_stored_blocks", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LMCacheMPRequestTracker.append_block_ids", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LMCacheMPRequestTracker.__repr__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LMCacheMPRequestTracker.__str__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LMCacheMPRequestTracker.request_id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LMCacheMPRequestTracker.all_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LMCacheMPRequestTracker.block_hashes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LMCacheMPRequestTracker.allocated_block_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LMCacheMPRequestTracker.num_scheduled_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LMCacheMPRequestTracker.num_stored_blocks", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LMCacheMPRequestTracker.num_vllm_hit_blocks", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LMCacheMPRequestTracker.num_lmcache_hit_blocks", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LMCacheMPRequestTracker.state", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 12, "n_typed": 8, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 4, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_mp_connector.LMCacheMPConnectorMetadata", "methods": [ { "kind": "function", "name": "LMCacheMPConnectorMetadata.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LMCacheMPConnectorMetadata.add_request_metadata", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LMCacheMPConnectorMetadata.__len__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LMCacheMPConnectorMetadata.__str__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LMCacheMPConnectorMetadata.__repr__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LMCacheMPConnectorMetadata.requests", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 7, "n_typed": 2, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 1, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_mp_connector.create_worker_adapter", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_mp_connector.extract_world_size_and_kv_rank", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_mp_connector.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_mp_connector.LMCacheMPConnector", "methods": [ { "kind": "function", "name": "LMCacheMPConnector.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LMCacheMPConnector._get_connector_metadata", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LMCacheMPConnector.register_kv_caches", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LMCacheMPConnector.start_load_kv", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LMCacheMPConnector.wait_for_layer_load", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LMCacheMPConnector.save_kv_layer", "n_typed": 4, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "LMCacheMPConnector.wait_for_save", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LMCacheMPConnector.get_finished", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LMCacheMPConnector.get_block_ids_with_load_errors", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LMCacheMPConnector.shutdown", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LMCacheMPConnector.get_kv_connector_stats", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LMCacheMPConnector.get_num_new_matched_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LMCacheMPConnector.update_state_after_alloc", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LMCacheMPConnector.build_connector_meta", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LMCacheMPConnector.update_connector_output", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LMCacheMPConnector.request_finished", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LMCacheMPConnector.take_events", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LMCacheMPConnector.get_required_kvcache_layout", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LMCacheMPConnector.get_finished_count", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LMCacheMPConnector.build_kv_connector_stats", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LMCacheMPConnector.build_prom_metrics", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "LMCacheMPConnector._process_retrieve_requests", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LMCacheMPConnector._process_new_requests", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LMCacheMPConnector._process_cached_requests", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LMCacheMPConnector._get_request_tracker", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LMCacheMPConnector._get_or_create_request_tracker", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LMCacheMPConnector._cleanup_request_tracker", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "LMCacheMPConnector.role", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "LMCacheMPConnector.vllm_block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LMCacheMPConnector.scheduler_adapter", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LMCacheMPConnector.request_trackers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LMCacheMPConnector.worker_adapter", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 67, "n_typed": 56, "n_any": 2, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 27, "n_method_overloads": 27, "n_method_params": 35, "n_attrs": 4, "n_properties": 1 } ], "type_ignores": [], "name": "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_mp_connector", "names": [ "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_mp_connector.LMCacheMPConnector", "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_mp_connector.LMCacheMPConnectorMetadata", "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_mp_connector.LMCacheMPRequestMetadata", "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_mp_connector.LMCacheMPRequestState", "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_mp_connector.LMCacheMPRequestTracker", "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_mp_connector.create_scheduler_adapter", "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_mp_connector.create_worker_adapter", "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_mp_connector.extract_world_size_and_kv_rank", "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_mp_connector.logger", "vllm.distributed.kv_transfer.kv_connector.v1.lmcache_mp_connector.reformat_block_ids" ], "n_typable": 109, "n_typed": 88, "n_any": 2, "n_untyped": 19, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 10, "n_methods": 42, "n_method_overloads": 42, "n_method_params": 46, "n_classes": 5, "n_attrs": 21, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/distributed/kv_transfer/kv_connector/v1/metrics.py", "symbol_reports": [ { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.metrics.KVConnectorPromMetrics", "methods": [ { "kind": "function", "name": "KVConnectorPromMetrics.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "KVConnectorPromMetrics.make_per_engine", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVConnectorPromMetrics.observe", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "KVConnectorPromMetrics.per_engine_labelvalues", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 8, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.metrics.KVConnectorLogging", "methods": [ { "kind": "function", "name": "KVConnectorLogging.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVConnectorLogging.reset", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KVConnectorLogging.observe", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVConnectorLogging.log", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "KVConnectorLogging.connector_cls", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 2, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 3, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.metrics.KVConnectorStats", "methods": [ { "kind": "function", "name": "KVConnectorStats.reset", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KVConnectorStats.aggregate", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVConnectorStats.reduce", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KVConnectorStats.is_empty", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "KVConnectorStats.data", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 5, "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 1, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.metrics.KVConnectorPrometheus", "methods": [ { "kind": "function", "name": "KVConnectorPrometheus.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "KVConnectorPrometheus.observe", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "KVConnectorPrometheus._gauge_cls", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "KVConnectorPrometheus._counter_cls", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "KVConnectorPrometheus._histogram_cls", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "KVConnectorPrometheus.prom_metrics", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 8, "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 4, "n_properties": 0 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.metrics.PromMetric", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.metrics.PromMetricT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.metrics.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.distributed.kv_transfer.kv_connector.v1.metrics", "names": [ "vllm.distributed.kv_transfer.kv_connector.v1.metrics.KVConnectorLogging", "vllm.distributed.kv_transfer.kv_connector.v1.metrics.KVConnectorPromMetrics", "vllm.distributed.kv_transfer.kv_connector.v1.metrics.KVConnectorPrometheus", "vllm.distributed.kv_transfer.kv_connector.v1.metrics.KVConnectorStats", "vllm.distributed.kv_transfer.kv_connector.v1.metrics.PromMetric", "vllm.distributed.kv_transfer.kv_connector.v1.metrics.PromMetricT", "vllm.distributed.kv_transfer.kv_connector.v1.metrics.logger" ], "n_typable": 34, "n_typed": 21, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 16, "n_classes": 4, "n_attrs": 10, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/kv_transfer/kv_connector/v1/mooncake/mooncake_connector.py", "symbol_reports": [ { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_connector.MooncakeConnectorMetadata", "methods": [ { "kind": "function", "name": "MooncakeConnectorMetadata.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MooncakeConnectorMetadata.add_new_req", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MooncakeConnectorMetadata.reqs_to_recv", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeConnectorMetadata.reqs_to_send", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeConnectorMetadata.reqs_not_processed", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 9, "n_typed": 7, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 3, "n_properties": 0 }, { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_connector.get_mooncake_bootstrap_addr", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_connector.should_launch_bootstrap_server", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_connector.ReqId", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_connector.MooncakeConnectorWorker", "methods": [ { "kind": "function", "name": "MooncakeConnectorWorker.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MooncakeConnectorWorker.__del__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MooncakeConnectorWorker.shutdown", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MooncakeConnectorWorker.register_worker_with_bootstrap", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MooncakeConnectorWorker._mooncake_sender_listener", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MooncakeConnectorWorker._sender_worker", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MooncakeConnectorWorker.send_kv_to_decode", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MooncakeConnectorWorker.resolve_need_send", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MooncakeConnectorWorker._build_transfer_params", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MooncakeConnectorWorker._send_blocks", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MooncakeConnectorWorker.register_kv_caches", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MooncakeConnectorWorker.fetch_finished_recving_reqs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MooncakeConnectorWorker.fetch_finished_sending_reqs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MooncakeConnectorWorker.get_finished", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MooncakeConnectorWorker.receive_kv_from_single_worker", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MooncakeConnectorWorker.process_pulling_result", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MooncakeConnectorWorker._connect_to_prefiller_bootstrap", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MooncakeConnectorWorker.receive_kv", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MooncakeConnectorWorker.handle_new_engine_id", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MooncakeConnectorWorker._start_load_kv", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MooncakeConnectorWorker.record_send_reqs", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MooncakeConnectorWorker.start_load_kv", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MooncakeConnectorWorker.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeConnectorWorker.engine", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeConnectorWorker.hostname", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeConnectorWorker.is_kv_producer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeConnectorWorker.is_kv_consumer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeConnectorWorker.num_sender_workers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeConnectorWorker.num_sender_tasks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeConnectorWorker.rpc_port", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeConnectorWorker.side_channel_port", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeConnectorWorker.engine_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeConnectorWorker.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeConnectorWorker.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeConnectorWorker.num_blocks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeConnectorWorker.dp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeConnectorWorker.pp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeConnectorWorker.kv_caches_base_addr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeConnectorWorker.device_kv_caches", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeConnectorWorker.reqs_need_send", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeConnectorWorker.finished_sending_reqs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeConnectorWorker.finished_recving_reqs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeConnectorWorker.block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeConnectorWorker.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeConnectorWorker.cache_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeConnectorWorker.use_mla", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeConnectorWorker.backend_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeConnectorWorker.kv_cache_layout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeConnectorWorker.kv_topo", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeConnectorWorker.async_zmq_ctx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeConnectorWorker.sender_worker_queue", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeConnectorWorker.sender_loop", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeConnectorWorker.receiver_loop", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeConnectorWorker.bootstrap_server", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 82, "n_typed": 42, "n_any": 0, "n_untyped": 40, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 22, "n_method_overloads": 22, "n_method_params": 28, "n_attrs": 32, "n_properties": 0 }, { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_connector.group_concurrent_contiguous", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_connector.MooncakeXferMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "MooncakeXferMetadata.remote_hostname", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeXferMetadata.remote_port", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeXferMetadata.remote_tp_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeXferMetadata.remote_tp_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeXferMetadata.req_blocks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeXferMetadata.kv_caches_base_addr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 6, "n_properties": 0 }, { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_connector.get_mooncake_side_channel_port", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_connector.TransferId", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_connector.PullReqMeta", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "PullReqMeta.d_req_id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PullReqMeta.transfer_id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PullReqMeta.local_block_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PullReqMeta.remote_engine_id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PullReqMeta.remote_bootstrap_addr", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PullReqMeta.expire_time", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PullReqMeta.pull_tasks_count", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_connector.MooncakeConnectorScheduler", "methods": [ { "kind": "function", "name": "MooncakeConnectorScheduler.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MooncakeConnectorScheduler.get_num_new_matched_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MooncakeConnectorScheduler.update_state_after_alloc", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MooncakeConnectorScheduler.build_connector_meta", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MooncakeConnectorScheduler.request_finished", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MooncakeConnectorScheduler.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeConnectorScheduler.is_kv_producer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeConnectorScheduler.is_kv_consumer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 18, "n_typed": 15, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 10, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_connector.MooncakeXferResponseStatus", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "MooncakeXferResponseStatus.FINISH", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MooncakeXferResponseStatus.CONTINUE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MooncakeXferResponseStatus.ERROR", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_connector.MooncakeXferResponse", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "MooncakeXferResponse.status", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeXferResponse.ok_reqs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeXferResponse.err_reqs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeXferResponse.err_msg", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_connector.MooncakeConnector", "methods": [ { "kind": "function", "name": "MooncakeConnector.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MooncakeConnector.get_num_new_matched_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MooncakeConnector.update_state_after_alloc", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MooncakeConnector.build_connector_meta", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MooncakeConnector.request_finished", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MooncakeConnector.register_kv_caches", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MooncakeConnector.get_finished", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MooncakeConnector.start_load_kv", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MooncakeConnector.wait_for_layer_load", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MooncakeConnector.save_kv_layer", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MooncakeConnector.wait_for_save", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MooncakeConnector.engine_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeConnector.connector_scheduler", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeConnector.connector_worker", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 34, "n_typed": 28, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 20, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_connector.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_connector.SendBlockMeta", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "SendBlockMeta.p_req_id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SendBlockMeta.transfer_id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SendBlockMeta.local_block_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SendBlockMeta.ready", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SendBlockMeta.expire_time", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SendBlockMeta.need_send", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SendBlockMeta.sent", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SendBlockMeta.sending", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 8, "n_properties": 0 } ], "type_ignores": [ { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] } ], "name": "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_connector", "names": [ "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_connector.MooncakeConnector", "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_connector.MooncakeConnectorMetadata", "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_connector.MooncakeConnectorScheduler", "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_connector.MooncakeConnectorWorker", "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_connector.MooncakeXferMetadata", "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_connector.MooncakeXferResponse", "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_connector.MooncakeXferResponseStatus", "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_connector.PullReqMeta", "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_connector.ReqId", "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_connector.SendBlockMeta", "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_connector.TransferId", "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_connector.get_mooncake_bootstrap_addr", "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_connector.get_mooncake_side_channel_port", "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_connector.group_concurrent_contiguous", "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_connector.logger", "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_connector.should_launch_bootstrap_server" ], "n_typable": 163, "n_typed": 111, "n_any": 0, "n_untyped": 52, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 5, "n_methods": 40, "n_method_overloads": 40, "n_method_params": 62, "n_classes": 9, "n_attrs": 72, "n_properties": 0, "n_type_ignores": 2 }, { "path": "vllm/distributed/kv_transfer/kv_connector/v1/mooncake/mooncake_utils.py", "symbol_reports": [ { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_utils.EngineEntry", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "EngineEntry.engine_id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineEntry.worker_addr", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_utils.RegisterWorkerPayload", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "RegisterWorkerPayload.engine_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "RegisterWorkerPayload.dp_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "RegisterWorkerPayload.tp_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "RegisterWorkerPayload.pp_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "RegisterWorkerPayload.addr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_utils.MooncakeBootstrapServer", "methods": [ { "kind": "function", "name": "MooncakeBootstrapServer.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MooncakeBootstrapServer.__del__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MooncakeBootstrapServer._register_routes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MooncakeBootstrapServer.start", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MooncakeBootstrapServer.shutdown", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MooncakeBootstrapServer.register_worker", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MooncakeBootstrapServer.query", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MooncakeBootstrapServer.workers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeBootstrapServer.host", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeBootstrapServer.port", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeBootstrapServer.app", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeBootstrapServer.server_thread", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MooncakeBootstrapServer.server", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 17, "n_typed": 8, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 4, "n_attrs": 6, "n_properties": 0 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_utils.WorkerAddr", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_utils", "names": [ "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_utils.EngineEntry", "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_utils.MooncakeBootstrapServer", "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_utils.RegisterWorkerPayload", "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_utils.WorkerAddr", "vllm.distributed.kv_transfer.kv_connector.v1.mooncake.mooncake_utils.logger" ], "n_typable": 23, "n_typed": 13, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 4, "n_classes": 3, "n_attrs": 15, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/kv_transfer/kv_connector/v1/moriio/moriio_common.py", "symbol_reports": [ { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.MoRIIOConfig", "methods": [ { "kind": "function", "name": "MoRIIOConfig.from_vllm_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MoRIIOConfig.local_ip", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MoRIIOConfig.local_kv_port", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MoRIIOConfig.proxy_ip", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MoRIIOConfig.local_ping_port", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MoRIIOConfig.proxy_ping_port", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MoRIIOConfig.http_port", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MoRIIOConfig.handshake_port", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MoRIIOConfig.notify_port", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MoRIIOConfig.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MoRIIOConfig.dp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MoRIIOConfig.dp_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MoRIIOConfig.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 12, "n_properties": 0 }, { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.zmq_ctx", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.HandshakeError", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.ReqId", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.RemoteAllocInfo", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "RemoteAllocInfo.block_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RemoteAllocInfo.writes_done", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RemoteAllocInfo.decode_dp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RemoteAllocInfo.transfer_offset", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.LayerTransferPlan", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "LayerTransferPlan.request_id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LayerTransferPlan.layer_name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LayerTransferPlan.sess_idx", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LayerTransferPlan.transfer_local_offsets", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LayerTransferPlan.transfer_remote_offsets", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LayerTransferPlan.transfer_sizes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LayerTransferPlan.use_batch", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 7, "n_properties": 0 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.Transfer", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.MoRIIOConstants", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "MoRIIOConstants.GET_META_MSG", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MoRIIOConstants.POP_DONE_RECV", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MoRIIOConstants.OVER", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MoRIIOConstants.COMPLETION_PREFIX", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MoRIIOConstants.PING_INTERVAL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MoRIIOConstants.MAX_PING_RETRIES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MoRIIOConstants.DEFAULT_HANDSHAKE_PORT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MoRIIOConstants.DEFAULT_NOTIFY_PORT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MoRIIOConstants.VLLM_MORI_READ_ABORT_REQUEST_TIMEOUT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 9, "n_properties": 0 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.EngineId", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.MoRIIOAgentMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "MoRIIOAgentMetadata.engine_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOAgentMetadata.agent_metadata", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOAgentMetadata.kv_caches_base_addr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOAgentMetadata.num_blocks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOAgentMetadata.block_len", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOAgentMetadata.attn_backend_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.WriteTask", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "WriteTask.request_id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "WriteTask.dst_engine_id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "WriteTask.local_block_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "WriteTask.remote_block_ids_hint", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "WriteTask.layer_name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "WriteTask.event", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "WriteTask.remote_notify_port", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "WriteTask.remote_ip", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "WriteTask.enqueue_time", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "WriteTask.retried", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 10, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.TransferError", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.ROLE", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ROLE.PRODUCER", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ROLE.CONSUMER", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ROLE.NOTINIT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.MoRIIOMode", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "MoRIIOMode.READ", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MoRIIOMode.WRITE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.ReqMeta", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ReqMeta.local_block_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ReqMeta.remote_block_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ReqMeta.remote_host", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ReqMeta.remote_port", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ReqMeta.remote_handshake_port", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ReqMeta.remote_notify_port", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ReqMeta.remote_engine_id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ReqMeta.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ReqMeta.remote_dp_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 9, "n_properties": 0 }, { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.get_role", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.set_role", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.get_moriio_mode", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.RoleManager", "methods": [ { "kind": "function", "name": "RoleManager.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RoleManager.get_instance", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RoleManager.set_role", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RoleManager.get_role", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RoleManager._instance", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "RoleManager._lock", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 1, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.MoRIIOError", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.MoRIIOConnectorMetadata", "methods": [ { "kind": "function", "name": "MoRIIOConnectorMetadata.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoRIIOConnectorMetadata.__repr__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoRIIOConnectorMetadata.add_new_req", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MoRIIOConnectorMetadata.reqs_to_recv", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorMetadata.reqs_to_save", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorMetadata.reqs_to_send", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 10, "n_typed": 6, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_attrs": 3, "n_properties": 0 }, { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.get_port_offset", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [ { "kind": "type", "rules": [ "call-arg" ] } ], "name": "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common", "names": [ "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.EngineId", "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.HandshakeError", "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.LayerTransferPlan", "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.MoRIIOAgentMetadata", "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.MoRIIOConfig", "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.MoRIIOConnectorMetadata", "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.MoRIIOConstants", "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.MoRIIOError", "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.MoRIIOMode", "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.ROLE", "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.RemoteAllocInfo", "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.ReqId", "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.ReqMeta", "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.RoleManager", "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.Transfer", "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.TransferError", "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.WriteTask", "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.get_moriio_mode", "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.get_port_offset", "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.get_role", "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.logger", "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.set_role", "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_common.zmq_ctx" ], "n_typable": 37, "n_typed": 29, "n_any": 1, "n_untyped": 7, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 6, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 6, "n_classes": 14, "n_attrs": 71, "n_properties": 0, "n_type_ignores": 1 }, { "path": "vllm/distributed/kv_transfer/kv_connector/v1/moriio/moriio_connector.py", "symbol_reports": [ { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_connector.is_moriio_available", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_connector.MoRIIOConnectorWorker", "methods": [ { "kind": "function", "name": "MoRIIOConnectorWorker.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MoRIIOConnectorWorker.schedule_write_blocks", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "MoRIIOConnectorWorker._get_built_session", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MoRIIOConnectorWorker._ping", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MoRIIOConnectorWorker.shutdown", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoRIIOConnectorWorker.__del__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoRIIOConnectorWorker._moriio_handshake_listener", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "MoRIIOConnectorWorker._moriio_handshake", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MoRIIOConnectorWorker._background_moriio_handshake", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MoRIIOConnectorWorker.register_kv_caches", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MoRIIOConnectorWorker.get_finished", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoRIIOConnectorWorker._pop_done_transfers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoRIIOConnectorWorker.save_kv_layer", "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MoRIIOConnectorWorker.get_engine_name_with_dp", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MoRIIOConnectorWorker.start_load_kv", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MoRIIOConnectorWorker._read_blocks_for_req", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MoRIIOConnectorWorker._write_blocks_for_req", "n_typed": 2, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MoRIIOConnectorWorker._is_last_layer", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MoRIIOConnectorWorker.merge_contiguous_blocks", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MoRIIOConnectorWorker._compute_block_transfer_offsets", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MoRIIOConnectorWorker._read_blocks", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MoRIIOConnectorWorker.moriio_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.mode", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.kv_transfer_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.is_producer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.dp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.local_ip", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.local_kv_port", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.proxy_ip", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.local_ping_port", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.proxy_ping_port", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.http_port", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.handshake_port", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.notify_port", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.zmq_context", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.metadata_address", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.request_address", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.moriio_engine", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.moriio_wrapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.local_kv_cache_metadata", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.local_kv_cache_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.layer_name_to_local_kv_cache_metadata", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.remote_kv_cache_metadata", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.remote_kv_cache_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.layer_name_to_remote_kv_cache_metadata", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.remote_moriio_metadata", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.slot_size_bytes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.load_ready_flag", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.write_ready_flags", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.kv_cache_shape", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.block_shape", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.kv_element_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.side_channel_port", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.engine_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.world_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.tp_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.kv_caches", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.kv_caches_base_addr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.num_regions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.num_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.dst_num_blocks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.cache_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.block_window_per_layer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.use_mla", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.built_session", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.built_write_session", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorWorker.backend_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 127, "n_typed": 71, "n_any": 0, "n_untyped": 56, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 21, "n_method_overloads": 21, "n_method_params": 56, "n_attrs": 50, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_connector.MoRIIOConnector", "methods": [ { "kind": "function", "name": "MoRIIOConnector.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MoRIIOConnector._set_port_defaults", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MoRIIOConnector.get_num_new_matched_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MoRIIOConnector.update_state_after_alloc", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MoRIIOConnector.build_connector_meta", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MoRIIOConnector.request_finished", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MoRIIOConnector.register_kv_caches", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MoRIIOConnector.get_finished", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MoRIIOConnector.start_load_kv", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MoRIIOConnector.wait_for_layer_load", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MoRIIOConnector.save_kv_layer", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MoRIIOConnector.wait_for_save", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoRIIOConnector.shutdown", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoRIIOConnector.has_connector_metadata", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MoRIIOConnector.kv_transfer_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnector.engine_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnector.mode", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnector.connector_scheduler", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnector.connector_worker", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 40, "n_typed": 29, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 21, "n_attrs": 5, "n_properties": 0 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_connector.MoRIIO_enabled", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_connector.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_connector.MoRIIOConnectorScheduler", "methods": [ { "kind": "function", "name": "MoRIIOConnectorScheduler.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MoRIIOConnectorScheduler.get_num_new_matched_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MoRIIOConnectorScheduler.send_notify_block", "n_typed": 2, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MoRIIOConnectorScheduler.update_state_after_alloc", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MoRIIOConnectorScheduler.build_connector_meta", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MoRIIOConnectorScheduler.shutdown", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoRIIOConnectorScheduler.request_finished", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MoRIIOConnectorScheduler.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorScheduler.kv_transfer_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorScheduler.block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorScheduler.engine_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorScheduler.mode", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorScheduler.host_ip", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorScheduler.handshake_port", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorScheduler.side_notify_port", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorScheduler.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorScheduler.dp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorScheduler.is_producer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOConnectorScheduler.paths", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 34, "n_typed": 18, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 15, "n_attrs": 12, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_connector", "names": [ "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_connector.MoRIIOConnector", "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_connector.MoRIIOConnectorScheduler", "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_connector.MoRIIOConnectorWorker", "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_connector.MoRIIO_enabled", "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_connector.is_moriio_available", "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_connector.logger" ], "n_typable": 203, "n_typed": 119, "n_any": 0, "n_untyped": 84, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 0, "n_methods": 42, "n_method_overloads": 42, "n_method_params": 92, "n_classes": 3, "n_attrs": 69, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/kv_transfer/kv_connector/v1/moriio/moriio_engine.py", "symbol_reports": [ { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_engine.MoRIIOWrapper", "methods": [ { "kind": "function", "name": "MoRIIOWrapper.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MoRIIOWrapper.set_moriio_engine", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MoRIIOWrapper.set_backend_type", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MoRIIOWrapper.get_agent_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoRIIOWrapper.register_remote_engine", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MoRIIOWrapper.register_local_tensor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MoRIIOWrapper.get_unpack_memory_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MoRIIOWrapper.build_session", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MoRIIOWrapper.read_remote_data", "n_typed": 0, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MoRIIOWrapper.write_remote_data", "n_typed": 0, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MoRIIOWrapper.write_remote_data_single", "n_typed": 0, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MoRIIOWrapper.waiting_for_transfer_complete", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoRIIOWrapper.async_wait_reqid", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoRIIOWrapper._handle_message", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MoRIIOWrapper._handle_structured_message", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MoRIIOWrapper._handle_completion_message", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MoRIIOWrapper.send_notify", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MoRIIOWrapper.pop_finished_req_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoRIIOWrapper.pop_finished_write_req_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoRIIOWrapper.shutdown", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MoRIIOWrapper.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOWrapper.dp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOWrapper.moriio_engine", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOWrapper.remote_memory_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOWrapper.local_memory_registered", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOWrapper.local_memory_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOWrapper.transfer_status", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOWrapper.remote_engine_ip", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOWrapper.notify_port", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOWrapper.lock", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOWrapper.done_req_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOWrapper.done_remote_allocate_req_dict", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOWrapper.done_write_cache_req_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOWrapper.notify_thread", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOWrapper.sessions", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MoRIIOWrapper.paths", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 64, "n_typed": 16, "n_any": 0, "n_untyped": 48, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 20, "n_method_overloads": 20, "n_method_params": 28, "n_attrs": 16, "n_properties": 0 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_engine.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_engine.MoRIIOWriter", "methods": [ { "kind": "function", "name": "MoRIIOWriter.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MoRIIOWriter.ensure_worker_started", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoRIIOWriter.schedule_write", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MoRIIOWriter._write_worker_loop", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoRIIOWriter._process_deferred_tasks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoRIIOWriter._is_remote_ready", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MoRIIOWriter._get_remote_alloc_info", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MoRIIOWriter._execute_write_task", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MoRIIOWriter._prepare_transfer_plan", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MoRIIOWriter._do_layer_write", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MoRIIOWriter._finalize_if_complete", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [ { "kind": "property", "name": "MoRIIOWriter.worker", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [], "n_typable": 24, "n_typed": 23, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 12, "n_attrs": 0, "n_properties": 1 } ], "type_ignores": [], "name": "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_engine", "names": [ "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_engine.MoRIIOWrapper", "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_engine.MoRIIOWriter", "vllm.distributed.kv_transfer.kv_connector.v1.moriio.moriio_engine.logger" ], "n_typable": 89, "n_typed": 39, "n_any": 0, "n_untyped": 50, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 31, "n_method_overloads": 31, "n_method_params": 40, "n_classes": 2, "n_attrs": 17, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/distributed/kv_transfer/kv_connector/v1/multi_connector.py", "symbol_reports": [ { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.multi_connector.MultiKVConnectorStats", "methods": [ { "kind": "function", "name": "MultiKVConnectorStats.aggregate", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiKVConnectorStats.reset", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MultiKVConnectorStats.reduce", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MultiKVConnectorStats.is_empty", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MultiKVConnectorStats.__getitem__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiKVConnectorStats.__setitem__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 10, "n_typed": 8, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.multi_connector.MultiConnector", "methods": [ { "kind": "function", "name": "MultiConnector.requires_piecewise_for_cudagraph", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiConnector.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MultiConnector._get_connector_classes_and_configs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiConnector.register_cross_layers_kv_cache", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MultiConnector.register_kv_caches", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiConnector.bind_connector_metadata", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiConnector.clear_connector_metadata", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MultiConnector.shutdown", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MultiConnector.start_load_kv", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MultiConnector.wait_for_layer_load", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiConnector.save_kv_layer", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MultiConnector.wait_for_save", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MultiConnector.get_finished", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiConnector.get_block_ids_with_load_errors", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MultiConnector.set_host_xfer_buffer_ops", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiConnector.handle_preemptions", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiConnector.get_finished_count", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MultiConnector.get_num_new_matched_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MultiConnector.update_state_after_alloc", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MultiConnector.build_connector_meta", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiConnector.update_connector_output", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiConnector.get_handshake_metadata", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MultiConnector.set_xfer_handshake_metadata", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiConnector.request_finished", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MultiConnector.take_events", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MultiConnector.get_required_kvcache_layout", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiConnector.build_kv_connector_stats", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiConnector.get_kv_connector_stats", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MultiConnector.build_prom_metrics", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MultiConnector.reset_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "MultiConnector.prefer_cross_layer_blocks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [], "n_typable": 66, "n_typed": 55, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 30, "n_method_overloads": 30, "n_method_params": 35, "n_attrs": 0, "n_properties": 1 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.multi_connector.MultiKVConnectorPromMetrics", "methods": [ { "kind": "function", "name": "MultiKVConnectorPromMetrics.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MultiKVConnectorPromMetrics.observe", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 7, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.multi_connector.MultiKVConnectorMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "MultiKVConnectorMetadata.metadata", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MultiKVConnectorMetadata.extra_async_saves", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.multi_connector.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.distributed.kv_transfer.kv_connector.v1.multi_connector", "names": [ "vllm.distributed.kv_transfer.kv_connector.v1.multi_connector.MultiConnector", "vllm.distributed.kv_transfer.kv_connector.v1.multi_connector.MultiKVConnectorMetadata", "vllm.distributed.kv_transfer.kv_connector.v1.multi_connector.MultiKVConnectorPromMetrics", "vllm.distributed.kv_transfer.kv_connector.v1.multi_connector.MultiKVConnectorStats", "vllm.distributed.kv_transfer.kv_connector.v1.multi_connector.logger" ], "n_typable": 86, "n_typed": 70, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 38, "n_method_overloads": 38, "n_method_params": 46, "n_classes": 4, "n_attrs": 3, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/distributed/kv_transfer/kv_connector/v1/nixl_connector.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector.nixlXferTelemetry", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector.GET_META_MSG", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector.NixlPromMetrics", "methods": [ { "kind": "function", "name": "NixlPromMetrics.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "NixlPromMetrics.observe", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "NixlPromMetrics.nixl_histogram_xfer_time", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NixlPromMetrics.nixl_histogram_post_time", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NixlPromMetrics.nixl_histogram_bytes_transferred", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NixlPromMetrics.nixl_histogram_num_descriptors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NixlPromMetrics.counter_nixl_num_failed_transfers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NixlPromMetrics.counter_nixl_num_failed_notifications", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NixlPromMetrics.counter_nixl_num_kv_expired_reqs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 6, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 7, "n_properties": 0 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector.nixl_agent_config", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector.NIXL_CONNECTOR_VERSION", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector.zmq_ctx", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector.ReqId", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector.NixlKVConnectorStats", "methods": [ { "kind": "function", "name": "NixlKVConnectorStats.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NixlKVConnectorStats.reset", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NixlKVConnectorStats.record_transfer", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NixlKVConnectorStats.record_failed_transfer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NixlKVConnectorStats.record_failed_notification", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NixlKVConnectorStats.record_kv_expired_req", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NixlKVConnectorStats.clone_and_reset", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NixlKVConnectorStats.is_empty", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NixlKVConnectorStats.aggregate", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NixlKVConnectorStats.reduce", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "NixlKVConnectorStats.num_successful_transfers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [], "n_typable": 13, "n_typed": 7, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 2, "n_attrs": 0, "n_properties": 1 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector.NixlConnector", "methods": [ { "kind": "function", "name": "NixlConnector.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "NixlConnector.get_required_kvcache_layout", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NixlConnector.get_num_new_matched_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NixlConnector.update_state_after_alloc", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "NixlConnector.build_connector_meta", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NixlConnector.request_finished", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NixlConnector.set_xfer_handshake_metadata", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NixlConnector.register_kv_caches", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NixlConnector.register_cross_layers_kv_cache", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NixlConnector.set_host_xfer_buffer_ops", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NixlConnector.get_finished", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NixlConnector.get_block_ids_with_load_errors", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NixlConnector.get_kv_connector_stats", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NixlConnector.build_kv_connector_stats", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NixlConnector.build_prom_metrics", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "NixlConnector.start_load_kv", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NixlConnector.wait_for_layer_load", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NixlConnector.save_kv_layer", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "NixlConnector.wait_for_save", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NixlConnector.shutdown", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NixlConnector.get_handshake_metadata", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "NixlConnector.prefer_cross_layer_blocks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "NixlConnector.engine_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnector.kv_transfer_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnector.connector_scheduler", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnector.connector_worker", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 56, "n_typed": 45, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 21, "n_method_overloads": 21, "n_method_params": 30, "n_attrs": 4, "n_properties": 1 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector.NixlConnectorMetadata", "methods": [ { "kind": "function", "name": "NixlConnectorMetadata.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NixlConnectorMetadata._add_new_req", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NixlConnectorMetadata.add_new_req_to_save", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "NixlConnectorMetadata.add_new_req_to_recv", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "NixlConnectorMetadata.reqs_to_recv", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorMetadata.reqs_to_save", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorMetadata.reqs_to_send", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorMetadata.reqs_in_batch", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorMetadata.reqs_not_processed", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 17, "n_typed": 14, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector.NixlHandshakePayload", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "NixlHandshakePayload.compatibility_hash", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NixlHandshakePayload.agent_metadata_bytes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector.RemoteMeta", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "RemoteMeta.block_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RemoteMeta.host", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RemoteMeta.port", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RemoteMeta.engine_id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RemoteMeta.request_id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 5, "n_properties": 0 }, { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector.compute_nixl_compatibility_hash", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector.NixlAgentMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "NixlAgentMetadata.engine_id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NixlAgentMetadata.agent_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NixlAgentMetadata.kv_caches_base_addr", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NixlAgentMetadata.device_id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NixlAgentMetadata.num_blocks", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NixlAgentMetadata.block_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NixlAgentMetadata.kv_cache_layout", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NixlAgentMetadata.block_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector.ReqMeta", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ReqMeta.local_block_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ReqMeta.local_physical_block_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ReqMeta.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ReqMeta.remote", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector.NixlConnectorWorker", "methods": [ { "kind": "function", "name": "NixlConnectorWorker.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NixlConnectorWorker._nixl_handshake", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "NixlConnectorWorker.initialize_host_xfer_buffer", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NixlConnectorWorker.set_host_xfer_buffer_ops", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NixlConnectorWorker._log_failure", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "NixlConnectorWorker._background_nixl_handshake", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "NixlConnectorWorker.register_kv_caches", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NixlConnectorWorker.register_local_xfer_handler", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NixlConnectorWorker.add_remote_agent", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "NixlConnectorWorker._validate_remote_agent_handshake", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NixlConnectorWorker.sync_recved_kv_to_device", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NixlConnectorWorker.save_kv_to_host", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NixlConnectorWorker.post_process_device_kv_on_receive", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NixlConnectorWorker.get_finished", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NixlConnectorWorker._get_new_notifs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NixlConnectorWorker._pop_done_transfers", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NixlConnectorWorker._handle_failed_transfer", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NixlConnectorWorker.start_load_kv", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NixlConnectorWorker._read_blocks_for_req", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NixlConnectorWorker._read_blocks", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "NixlConnectorWorker.get_mapped_blocks", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NixlConnectorWorker._get_block_descs_ids", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "NixlConnectorWorker._logical_to_kernel_block_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NixlConnectorWorker.get_backend_aware_kv_block_len", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NixlConnectorWorker.get_kv_connector_stats", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NixlConnectorWorker.get_block_ids_with_load_errors", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NixlConnectorWorker.__del__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NixlConnectorWorker.shutdown", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "NixlConnectorWorker.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorWorker.block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorWorker.kv_transfer_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorWorker.nixl_backends", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorWorker.nixl_wrapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorWorker.engine_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorWorker.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorWorker.world_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorWorker.tp_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorWorker.num_blocks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorWorker.enable_permute_local_kv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorWorker.device_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorWorker.kv_buffer_device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorWorker.device_kv_caches", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorWorker.host_xfer_buffers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorWorker.nixl_memory_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorWorker.copy_blocks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorWorker.device_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorWorker.kv_caches_base_addr", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorWorker.num_regions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorWorker.num_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorWorker.src_xfer_handles_by_block_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorWorker.src_xfer_handles_by_tp_ratio", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorWorker.dst_xfer_side_handles", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorWorker.dst_num_blocks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorWorker.xfer_handshake_metadata", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorWorker.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorWorker.cache_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorWorker.block_window_per_layer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorWorker.use_mla", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorWorker.attn_backend", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorWorker.backend_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorWorker.kv_cache_layout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorWorker.host_buffer_kv_cache_layout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorWorker.compat_hash", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorWorker.kv_topo", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorWorker.consumer_notification_counts_by_req", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorWorker.xfer_stats", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorWorker.enforce_compat_hash", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorWorker.use_host_buffer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 119, "n_typed": 73, "n_any": 0, "n_untyped": 46, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 28, "n_method_overloads": 28, "n_method_params": 51, "n_attrs": 40, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector.NixlConnectorScheduler", "methods": [ { "kind": "function", "name": "NixlConnectorScheduler.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NixlConnectorScheduler.shutdown", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NixlConnectorScheduler.set_xfer_handshake_metadata", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NixlConnectorScheduler._nixl_handshake_listener", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "NixlConnectorScheduler.get_num_new_matched_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NixlConnectorScheduler.update_state_after_alloc", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "NixlConnectorScheduler.build_connector_meta", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NixlConnectorScheduler.request_finished", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "NixlConnectorScheduler.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorScheduler.block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorScheduler.engine_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorScheduler.side_channel_host", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorScheduler.side_channel_port", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NixlConnectorScheduler.use_host_buffer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 29, "n_typed": 20, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 15, "n_attrs": 6, "n_properties": 0 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector.TransferHandle", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector.NixlWrapper", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector", "names": [ "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector.GET_META_MSG", "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector.NIXL_CONNECTOR_VERSION", "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector.NixlAgentMetadata", "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector.NixlConnector", "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector.NixlConnectorMetadata", "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector.NixlConnectorScheduler", "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector.NixlConnectorWorker", "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector.NixlHandshakePayload", "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector.NixlKVConnectorStats", "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector.NixlPromMetrics", "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector.NixlWrapper", "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector.RemoteMeta", "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector.ReqId", "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector.ReqMeta", "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector.TransferHandle", "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector.compute_nixl_compatibility_hash", "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector.logger", "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector.nixlXferTelemetry", "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector.nixl_agent_config", "vllm.distributed.kv_transfer.kv_connector.v1.nixl_connector.zmq_ctx" ], "n_typable": 258, "n_typed": 172, "n_any": 1, "n_untyped": 85, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 5, "n_methods": 73, "n_method_overloads": 73, "n_method_params": 112, "n_classes": 10, "n_attrs": 89, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/distributed/kv_transfer/kv_connector/v1/offloading_connector.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.offloading_connector.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.offloading_connector.OffloadingConnectorMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "OffloadingConnectorMetadata.reqs_to_load", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "OffloadingConnectorMetadata.reqs_to_store", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.offloading_connector.ReqId", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.offloading_connector.OffloadingConnectorScheduler", "methods": [ { "kind": "function", "name": "OffloadingConnectorScheduler.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OffloadingConnectorScheduler._get_block_hashes", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "OffloadingConnectorScheduler.get_num_new_matched_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OffloadingConnectorScheduler.update_state_after_alloc", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "OffloadingConnectorScheduler._get_reqs_to_store", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OffloadingConnectorScheduler.build_connector_meta", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OffloadingConnectorScheduler.update_connector_output", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OffloadingConnectorScheduler.request_finished", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OffloadingConnectorScheduler.take_events", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OffloadingConnectorScheduler.gpu_block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OffloadingConnectorScheduler.offloaded_block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OffloadingConnectorScheduler.block_size_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OffloadingConnectorScheduler.manager", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 27, "n_typed": 20, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 14, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.offloading_connector.OffloadingConnector", "methods": [ { "kind": "function", "name": "OffloadingConnector.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "OffloadingConnector.register_kv_caches", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OffloadingConnector.register_cross_layers_kv_cache", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OffloadingConnector.handle_preemptions", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OffloadingConnector.start_load_kv", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OffloadingConnector.wait_for_layer_load", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OffloadingConnector.save_kv_layer", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "OffloadingConnector.wait_for_save", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "OffloadingConnector.get_finished", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OffloadingConnector.get_num_new_matched_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OffloadingConnector.update_state_after_alloc", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "OffloadingConnector.build_connector_meta", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OffloadingConnector.update_connector_output", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OffloadingConnector.request_finished", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OffloadingConnector.take_events", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "OffloadingConnector.get_kv_connector_stats", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "OffloadingConnector.build_kv_connector_stats", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OffloadingConnector.build_prom_metrics", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [ { "kind": "property", "name": "OffloadingConnector.prefer_cross_layer_blocks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "OffloadingConnector.connector_scheduler", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "OffloadingConnector.connector_worker", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 50, "n_typed": 41, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 18, "n_method_overloads": 18, "n_method_params": 29, "n_attrs": 2, "n_properties": 1 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.offloading_connector.OffloadingConnectorWorker", "methods": [ { "kind": "function", "name": "OffloadingConnectorWorker.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OffloadingConnectorWorker._generate_job_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "OffloadingConnectorWorker._register_handlers", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OffloadingConnectorWorker.register_kv_caches", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OffloadingConnectorWorker.register_cross_layers_kv_cache", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OffloadingConnectorWorker.handle_preemptions", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OffloadingConnectorWorker.start_kv_transfers", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OffloadingConnectorWorker.prepare_store_kv", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OffloadingConnectorWorker.get_finished", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OffloadingConnectorWorker.get_kv_connector_stats", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OffloadingConnectorWorker.spec", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OffloadingConnectorWorker.worker", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OffloadingConnectorWorker.kv_connector_stats", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 23, "n_typed": 13, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 10, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.offloading_connector.OffloadingConnectorStats", "methods": [ { "kind": "function", "name": "OffloadingConnectorStats.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "OffloadingConnectorStats.reset", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "OffloadingConnectorStats.aggregate", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OffloadingConnectorStats.reduce", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "OffloadingConnectorStats.is_empty", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "OffloadingConnectorStats.record_transfer", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 10, "n_typed": 7, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.offloading_connector.OffloadPromMetrics", "methods": [ { "kind": "function", "name": "OffloadPromMetrics.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "OffloadPromMetrics.observe", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OffloadPromMetrics.histogram_transfer_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "OffloadPromMetrics.counter_kv_bytes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "OffloadPromMetrics.counter_kv_transfer_time", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 11, "n_typed": 9, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.offloading_connector.OffloadingOperationMetrics", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "OffloadingOperationMetrics.op_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "OffloadingOperationMetrics.op_time", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.distributed.kv_transfer.kv_connector.v1.offloading_connector", "names": [ "vllm.distributed.kv_transfer.kv_connector.v1.offloading_connector.OffloadPromMetrics", "vllm.distributed.kv_transfer.kv_connector.v1.offloading_connector.OffloadingConnector", "vllm.distributed.kv_transfer.kv_connector.v1.offloading_connector.OffloadingConnectorMetadata", "vllm.distributed.kv_transfer.kv_connector.v1.offloading_connector.OffloadingConnectorScheduler", "vllm.distributed.kv_transfer.kv_connector.v1.offloading_connector.OffloadingConnectorStats", "vllm.distributed.kv_transfer.kv_connector.v1.offloading_connector.OffloadingConnectorWorker", "vllm.distributed.kv_transfer.kv_connector.v1.offloading_connector.OffloadingOperationMetrics", "vllm.distributed.kv_transfer.kv_connector.v1.offloading_connector.ReqId", "vllm.distributed.kv_transfer.kv_connector.v1.offloading_connector.logger" ], "n_typable": 122, "n_typed": 90, "n_any": 0, "n_untyped": 32, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 45, "n_method_overloads": 45, "n_method_params": 63, "n_classes": 7, "n_attrs": 18, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/distributed/kv_transfer/kv_connector/v1/p2p/p2p_nccl_connector.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.p2p.p2p_nccl_connector.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.p2p.p2p_nccl_connector.P2pNcclConnectorMetadata", "methods": [ { "kind": "function", "name": "P2pNcclConnectorMetadata.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "P2pNcclConnectorMetadata.add_request", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "P2pNcclConnectorMetadata.requests", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 6, "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.p2p.p2p_nccl_connector.ReqMeta", "methods": [ { "kind": "function", "name": "ReqMeta.make_meta", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ReqMeta.request_id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ReqMeta.block_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ReqMeta.num_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 4, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.p2p.p2p_nccl_connector.P2pNcclConnector", "methods": [ { "kind": "function", "name": "P2pNcclConnector.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "P2pNcclConnector.start_load_kv", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "P2pNcclConnector.wait_for_layer_load", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "P2pNcclConnector.save_kv_layer", "n_typed": 4, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "P2pNcclConnector.wait_for_save", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "P2pNcclConnector.get_finished", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "P2pNcclConnector.get_num_new_matched_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "P2pNcclConnector.update_state_after_alloc", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "P2pNcclConnector.build_connector_meta", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "P2pNcclConnector.request_finished", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "P2pNcclConnector.parse_request_id", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "P2pNcclConnector.check_tensors_except_dim", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "P2pNcclConnector.is_producer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "P2pNcclConnector.chunked_prefill", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "P2pNcclConnector.p2p_nccl_engine", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 40, "n_typed": 27, "n_any": 3, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 25, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.distributed.kv_transfer.kv_connector.v1.p2p.p2p_nccl_connector", "names": [ "vllm.distributed.kv_transfer.kv_connector.v1.p2p.p2p_nccl_connector.P2pNcclConnector", "vllm.distributed.kv_transfer.kv_connector.v1.p2p.p2p_nccl_connector.P2pNcclConnectorMetadata", "vllm.distributed.kv_transfer.kv_connector.v1.p2p.p2p_nccl_connector.ReqMeta", "vllm.distributed.kv_transfer.kv_connector.v1.p2p.p2p_nccl_connector.logger" ], "n_typable": 52, "n_typed": 37, "n_any": 3, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 33, "n_classes": 3, "n_attrs": 8, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/kv_transfer/kv_connector/v1/p2p/p2p_nccl_engine.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.p2p.p2p_nccl_engine.DEFAULT_MEM_POOL_SIZE_GB", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.p2p.p2p_nccl_engine.P2pNcclEngine", "methods": [ { "kind": "function", "name": "P2pNcclEngine.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "P2pNcclEngine.create_connect", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "P2pNcclEngine.send_tensor", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "P2pNcclEngine.recv_tensor", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "P2pNcclEngine.listen_for_requests", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "P2pNcclEngine.have_sent_tensor_id", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "P2pNcclEngine.have_received_tensor_id", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "P2pNcclEngine.send_async", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "P2pNcclEngine.wait_for_sent", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "P2pNcclEngine.send_sync", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "P2pNcclEngine.get_finished", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "P2pNcclEngine.ping", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "P2pNcclEngine.send", "n_typed": 2, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "P2pNcclEngine.recv", "n_typed": 2, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "P2pNcclEngine.close", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "P2pNcclEngine.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "P2pNcclEngine.rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "P2pNcclEngine.local_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "P2pNcclEngine.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "P2pNcclEngine.nccl", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "P2pNcclEngine.zmq_address", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "P2pNcclEngine.context", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "P2pNcclEngine.router_socket", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "P2pNcclEngine.poller", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "P2pNcclEngine.send_store_cv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "P2pNcclEngine.send_queue_cv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "P2pNcclEngine.recv_store_cv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "P2pNcclEngine.send_stream", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "P2pNcclEngine.recv_stream", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "P2pNcclEngine.pool", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "P2pNcclEngine.send_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "P2pNcclEngine.recv_store", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "P2pNcclEngine.recv_request_id_to_tensor_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "P2pNcclEngine.send_request_id_to_tensor_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "P2pNcclEngine.socks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "P2pNcclEngine.comms", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "P2pNcclEngine.buffer_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "P2pNcclEngine.buffer_size_threshold", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "P2pNcclEngine.nccl_num_channels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "P2pNcclEngine.proxy_address", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "P2pNcclEngine.http_address", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "P2pNcclEngine.send_store", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "P2pNcclEngine.send_queue", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 67, "n_typed": 32, "n_any": 0, "n_untyped": 35, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 24, "n_attrs": 28, "n_properties": 0 }, { "kind": "function", "name": "vllm.distributed.kv_transfer.kv_connector.v1.p2p.p2p_nccl_engine.set_p2p_nccl_context", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.p2p.p2p_nccl_engine.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.p2p.p2p_nccl_engine.SendQueueItem", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "SendQueueItem.tensor_id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SendQueueItem.remote_address", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SendQueueItem.tensor", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.distributed.kv_transfer.kv_connector.v1.p2p.p2p_nccl_engine", "names": [ "vllm.distributed.kv_transfer.kv_connector.v1.p2p.p2p_nccl_engine.DEFAULT_MEM_POOL_SIZE_GB", "vllm.distributed.kv_transfer.kv_connector.v1.p2p.p2p_nccl_engine.P2pNcclEngine", "vllm.distributed.kv_transfer.kv_connector.v1.p2p.p2p_nccl_engine.SendQueueItem", "vllm.distributed.kv_transfer.kv_connector.v1.p2p.p2p_nccl_engine.logger", "vllm.distributed.kv_transfer.kv_connector.v1.p2p.p2p_nccl_engine.set_p2p_nccl_context" ], "n_typable": 70, "n_typed": 33, "n_any": 0, "n_untyped": 37, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 24, "n_classes": 2, "n_attrs": 33, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/kv_transfer/kv_connector/v1/p2p/tensor_memory_pool.py", "symbol_reports": [ { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.p2p.tensor_memory_pool.MemoryBlock", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "MemoryBlock.size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MemoryBlock.addr", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.distributed.kv_transfer.kv_connector.v1.p2p.tensor_memory_pool.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.distributed.kv_transfer.kv_connector.v1.p2p.tensor_memory_pool.TensorMemoryPool", "methods": [ { "kind": "function", "name": "TensorMemoryPool.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TensorMemoryPool._round_to_power_of_two", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TensorMemoryPool._initialize_free_lists", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TensorMemoryPool._allocate_pinned_memory", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TensorMemoryPool.allocate", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TensorMemoryPool._split_block", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TensorMemoryPool.free", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TensorMemoryPool._merge_buddies", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TensorMemoryPool.store_tensor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TensorMemoryPool.load_tensor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "TensorMemoryPool.cleanup", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TensorMemoryPool.__del__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TensorMemoryPool.max_block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TensorMemoryPool.min_block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TensorMemoryPool.free_lists", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TensorMemoryPool.allocated_blocks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 29, "n_typed": 19, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 13, "n_attrs": 4, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.distributed.kv_transfer.kv_connector.v1.p2p.tensor_memory_pool", "names": [ "vllm.distributed.kv_transfer.kv_connector.v1.p2p.tensor_memory_pool.MemoryBlock", "vllm.distributed.kv_transfer.kv_connector.v1.p2p.tensor_memory_pool.TensorMemoryPool", "vllm.distributed.kv_transfer.kv_connector.v1.p2p.tensor_memory_pool.logger" ], "n_typable": 30, "n_typed": 19, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 13, "n_classes": 2, "n_attrs": 7, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/parallel_state.py", "symbol_reports": [ { "kind": "class", "name": "vllm.distributed.parallel_state.GraphCaptureContext", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "GraphCaptureContext.stream", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.parallel_state.Handle", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.distributed.parallel_state.model_parallel_is_initialized", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.distributed.parallel_state.get_tensor_model_parallel_world_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.distributed.parallel_state.get_node_count", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.distributed.parallel_state.get_dp_group", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.distributed.parallel_state.get_pp_group", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.distributed.parallel_state.initialize_model_parallel", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.distributed.parallel_state.destroy_distributed_environment", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.distributed.parallel_state.get_dcp_group", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.distributed.parallel_state.get_decode_context_model_parallel_world_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.distributed.parallel_state.get_inner_dp_world_group", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.distributed.parallel_state.all_gather_fake", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "attr", "name": "vllm.distributed.parallel_state.TensorMetadata", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.distributed.parallel_state.init_world_group", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.distributed.parallel_state.init_model_parallel_group", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.distributed.parallel_state.get_tp_group", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.distributed.parallel_state.is_global_first_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.distributed.parallel_state.in_the_same_node_as", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.distributed.parallel_state.get_decode_context_model_parallel_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.distributed.parallel_state.all_gather", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.distributed.parallel_state.patched_fused_scaled_matmul_reduce_scatter", "n_typed": 14, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 }, { "kind": "function", "name": "vllm.distributed.parallel_state.graph_capture", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.distributed.parallel_state.get_pcp_group", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.distributed.parallel_state.patch_tensor_parallel_group", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.distributed.parallel_state.all_reduce", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.distributed.parallel_state.patched_fused_scaled_matmul_reduce_scatter_fake", "n_typed": 14, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 }, { "kind": "function", "name": "vllm.distributed.parallel_state.get_world_group", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.distributed.parallel_state.set_custom_all_reduce", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.distributed.parallel_state.ensure_model_parallel_initialized", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.distributed.parallel_state.init_distributed_environment", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.distributed.parallel_state.is_local_first_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.distributed.parallel_state.get_ep_group", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "class", "name": "vllm.distributed.parallel_state.GroupCoordinator", "methods": [ { "kind": "function", "name": "GroupCoordinator.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "GroupCoordinator.create_mq_broadcaster", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GroupCoordinator.create_single_reader_mq_broadcasters", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GroupCoordinator.graph_capture", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GroupCoordinator.all_reduce", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GroupCoordinator._all_reduce_out_place", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GroupCoordinator.all_gather", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GroupCoordinator._all_gather_out_place", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GroupCoordinator.all_gatherv", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GroupCoordinator.reduce_scatter", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GroupCoordinator.reduce_scatterv", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GroupCoordinator._reduce_scatter_out_place", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GroupCoordinator.gather", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GroupCoordinator.broadcast", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GroupCoordinator.broadcast_object", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GroupCoordinator.broadcast_object_list", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GroupCoordinator.send_object", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GroupCoordinator.recv_object", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GroupCoordinator.broadcast_tensor_dict", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GroupCoordinator._should_use_all_gather", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GroupCoordinator.send_tensor_dict", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GroupCoordinator.isend_tensor_dict", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GroupCoordinator.recv_tensor_dict", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GroupCoordinator.irecv_tensor_dict", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GroupCoordinator.barrier", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GroupCoordinator.send", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GroupCoordinator.recv", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GroupCoordinator.destroy", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GroupCoordinator.prepare_communication_buffer_for_model", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GroupCoordinator.dispatch_router_logits", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GroupCoordinator.dispatch", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "GroupCoordinator.combine", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [ { "kind": "property", "name": "GroupCoordinator.first_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "GroupCoordinator.last_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "GroupCoordinator.is_first_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "GroupCoordinator.is_last_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "GroupCoordinator.next_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "GroupCoordinator.prev_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "GroupCoordinator.rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GroupCoordinator.ranks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GroupCoordinator.world_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GroupCoordinator.local_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GroupCoordinator.rank_in_group", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GroupCoordinator.cpu_group", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GroupCoordinator.device_group", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GroupCoordinator.device_communicator", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GroupCoordinator.mq_broadcaster", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GroupCoordinator.unique_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GroupCoordinator.use_device_communicator", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GroupCoordinator.use_custom_op_call", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GroupCoordinator.use_cpu_custom_send_recv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GroupCoordinator.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 132, "n_typed": 102, "n_any": 2, "n_untyped": 28, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 32, "n_method_overloads": 32, "n_method_params": 80, "n_attrs": 14, "n_properties": 6 }, { "kind": "function", "name": "vllm.distributed.parallel_state.cleanup_dist_env_and_memory", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.distributed.parallel_state.get_tensor_model_parallel_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.distributed.parallel_state.reduce_scatter", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.distributed.parallel_state.reduce_scatter_fake", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.distributed.parallel_state.all_reduce_fake", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.distributed.parallel_state.prepare_communication_buffer_for_model", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.distributed.parallel_state.get_eplb_group", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.distributed.parallel_state.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.distributed.parallel_state.destroy_model_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "type_ignores": [], "name": "vllm.distributed.parallel_state", "names": [ "vllm.distributed.parallel_state.GraphCaptureContext", "vllm.distributed.parallel_state.GroupCoordinator", "vllm.distributed.parallel_state.Handle", "vllm.distributed.parallel_state.TensorMetadata", "vllm.distributed.parallel_state.all_gather", "vllm.distributed.parallel_state.all_gather_fake", "vllm.distributed.parallel_state.all_reduce", "vllm.distributed.parallel_state.all_reduce_fake", "vllm.distributed.parallel_state.cleanup_dist_env_and_memory", "vllm.distributed.parallel_state.destroy_distributed_environment", "vllm.distributed.parallel_state.destroy_model_parallel", "vllm.distributed.parallel_state.ensure_model_parallel_initialized", "vllm.distributed.parallel_state.get_dcp_group", "vllm.distributed.parallel_state.get_decode_context_model_parallel_rank", "vllm.distributed.parallel_state.get_decode_context_model_parallel_world_size", "vllm.distributed.parallel_state.get_dp_group", "vllm.distributed.parallel_state.get_ep_group", "vllm.distributed.parallel_state.get_eplb_group", "vllm.distributed.parallel_state.get_inner_dp_world_group", "vllm.distributed.parallel_state.get_node_count", "vllm.distributed.parallel_state.get_pcp_group", "vllm.distributed.parallel_state.get_pp_group", "vllm.distributed.parallel_state.get_tensor_model_parallel_rank", "vllm.distributed.parallel_state.get_tensor_model_parallel_world_size", "vllm.distributed.parallel_state.get_tp_group", "vllm.distributed.parallel_state.get_world_group", "vllm.distributed.parallel_state.graph_capture", "vllm.distributed.parallel_state.in_the_same_node_as", "vllm.distributed.parallel_state.init_distributed_environment", "vllm.distributed.parallel_state.init_model_parallel_group", "vllm.distributed.parallel_state.init_world_group", "vllm.distributed.parallel_state.initialize_model_parallel", "vllm.distributed.parallel_state.is_global_first_rank", "vllm.distributed.parallel_state.is_local_first_rank", "vllm.distributed.parallel_state.logger", "vllm.distributed.parallel_state.model_parallel_is_initialized", "vllm.distributed.parallel_state.patch_tensor_parallel_group", "vllm.distributed.parallel_state.patched_fused_scaled_matmul_reduce_scatter", "vllm.distributed.parallel_state.patched_fused_scaled_matmul_reduce_scatter_fake", "vllm.distributed.parallel_state.prepare_communication_buffer_for_model", "vllm.distributed.parallel_state.reduce_scatter", "vllm.distributed.parallel_state.reduce_scatter_fake", "vllm.distributed.parallel_state.set_custom_all_reduce" ], "n_typable": 249, "n_typed": 209, "n_any": 2, "n_untyped": 38, "n_functions": 38, "n_function_overloads": 38, "n_function_params": 78, "n_methods": 32, "n_method_overloads": 32, "n_method_params": 80, "n_classes": 3, "n_attrs": 17, "n_properties": 6, "n_type_ignores": 0 }, { "path": "vllm/distributed/stateless_coordinator.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.distributed.stateless_coordinator.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.distributed.stateless_coordinator.StatelessGroupCoordinator", "methods": [ { "kind": "function", "name": "StatelessGroupCoordinator.__init__", "n_typed": 10, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "StatelessGroupCoordinator.destroy", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "StatelessGroupCoordinator.size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "StatelessGroupCoordinator.broadcast", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StatelessGroupCoordinator.broadcast_object", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StatelessGroupCoordinator.broadcast_object_list", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "StatelessGroupCoordinator.broadcast_tensor_dict", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "StatelessGroupCoordinator.send_object", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StatelessGroupCoordinator.recv_object", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StatelessGroupCoordinator.send_tensor_dict", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "StatelessGroupCoordinator.recv_tensor_dict", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "StatelessGroupCoordinator.barrier", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "StatelessGroupCoordinator.gather", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "StatelessGroupCoordinator.unique_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StatelessGroupCoordinator.rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StatelessGroupCoordinator.local_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StatelessGroupCoordinator.backend", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StatelessGroupCoordinator.cpu_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StatelessGroupCoordinator.device_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StatelessGroupCoordinator.tcp_store_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StatelessGroupCoordinator.use_device_communicator", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StatelessGroupCoordinator.device_communicator", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StatelessGroupCoordinator.mq_broadcaster", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StatelessGroupCoordinator.use_custom_op_call", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StatelessGroupCoordinator.use_cpu_custom_send_recv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StatelessGroupCoordinator.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StatelessGroupCoordinator.ranks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StatelessGroupCoordinator.world_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StatelessGroupCoordinator.rank_in_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 63, "n_typed": 38, "n_any": 0, "n_untyped": 25, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 34, "n_attrs": 16, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.distributed.stateless_coordinator", "names": [ "vllm.distributed.stateless_coordinator.StatelessGroupCoordinator", "vllm.distributed.stateless_coordinator.logger" ], "n_typable": 64, "n_typed": 38, "n_any": 0, "n_untyped": 26, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 34, "n_classes": 1, "n_attrs": 17, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.distributed.utils.init_gloo_process_group", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "attr", "name": "vllm.distributed.utils.USE_SCHED_YIELD", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.distributed.utils.stateless_init_torch_distributed_process_group", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "vllm.distributed.utils.get_pp_indices", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.distributed.utils.sched_yield", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "class", "name": "vllm.distributed.utils.StatelessProcessGroup", "methods": [ { "kind": "function", "name": "StatelessProcessGroup.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "StatelessProcessGroup.send_obj", "n_typed": 1, "n_any": 1, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StatelessProcessGroup.expire_data", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "StatelessProcessGroup.recv_obj", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StatelessProcessGroup.broadcast_obj", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StatelessProcessGroup.all_gather_obj", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StatelessProcessGroup.broadcast", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StatelessProcessGroup.send", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StatelessProcessGroup.recv", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StatelessProcessGroup.all_reduce", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StatelessProcessGroup.barrier", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StatelessProcessGroup.create", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "StatelessProcessGroup.rank", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StatelessProcessGroup.world_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StatelessProcessGroup.store", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StatelessProcessGroup.socket", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StatelessProcessGroup.data_expiration_seconds", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StatelessProcessGroup.send_dst_counter", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StatelessProcessGroup.recv_src_counter", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StatelessProcessGroup.broadcast_send_counter", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StatelessProcessGroup.broadcast_recv_src_counter", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StatelessProcessGroup.entries", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 33, "n_typed": 23, "n_any": 4, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 21, "n_attrs": 10, "n_properties": 0 }, { "kind": "function", "name": "vllm.distributed.utils.get_worker_rank_suffix", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.distributed.utils.ensure_divisibility", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.distributed.utils.stateless_destroy_torch_distributed_process_group", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.distributed.utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.distributed.utils.divide", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.distributed.utils.split_tensor_along_last_dim", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [], "name": "vllm.distributed.utils", "names": [ "vllm.distributed.utils.StatelessProcessGroup", "vllm.distributed.utils.USE_SCHED_YIELD", "vllm.distributed.utils.divide", "vllm.distributed.utils.ensure_divisibility", "vllm.distributed.utils.get_pp_indices", "vllm.distributed.utils.get_worker_rank_suffix", "vllm.distributed.utils.init_gloo_process_group", "vllm.distributed.utils.logger", "vllm.distributed.utils.sched_yield", "vllm.distributed.utils.split_tensor_along_last_dim", "vllm.distributed.utils.stateless_destroy_torch_distributed_process_group", "vllm.distributed.utils.stateless_init_torch_distributed_process_group" ], "n_typable": 66, "n_typed": 48, "n_any": 4, "n_untyped": 14, "n_functions": 9, "n_function_overloads": 9, "n_function_params": 23, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 21, "n_classes": 1, "n_attrs": 12, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/weight_transfer/factory.py", "symbol_reports": [ { "kind": "class", "name": "vllm.distributed.weight_transfer.factory.WeightTransferEngineFactory", "methods": [ { "kind": "function", "name": "WeightTransferEngineFactory.register_engine", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "WeightTransferEngineFactory.create_engine", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "WeightTransferEngineFactory._registry", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 8, "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.distributed.weight_transfer.factory.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.distributed.weight_transfer.factory", "names": [ "vllm.distributed.weight_transfer.factory.WeightTransferEngineFactory", "vllm.distributed.weight_transfer.factory.logger" ], "n_typable": 9, "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_classes": 1, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/weight_transfer/base.py", "symbol_reports": [ { "kind": "class", "name": "vllm.distributed.weight_transfer.base.WeightTransferInitRequest", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "WeightTransferInitRequest.init_info", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.weight_transfer.base.WeightTransferInitInfo", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.weight_transfer.base.WeightTransferUpdateRequest", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "WeightTransferUpdateRequest.update_info", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.distributed.weight_transfer.base.TUpdateInfo", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.distributed.weight_transfer.base.WeightTransferUpdateInfo", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "WeightTransferUpdateInfo._", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "WeightTransferUpdateInfo.is_checkpoint_format", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.weight_transfer.base.WeightTransferEngine", "methods": [ { "kind": "function", "name": "WeightTransferEngine.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "WeightTransferEngine.parse_init_info", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WeightTransferEngine.parse_update_info", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WeightTransferEngine.init_transfer_engine", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WeightTransferEngine.receive_weights", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "WeightTransferEngine.shutdown", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "WeightTransferEngine.trainer_send_weights", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "WeightTransferEngine.init_info_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "WeightTransferEngine.update_info_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "WeightTransferEngine.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WeightTransferEngine.parallel_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 18, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 9, "n_attrs": 4, "n_properties": 0 }, { "kind": "attr", "name": "vllm.distributed.weight_transfer.base.TInitInfo", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.distributed.weight_transfer.base", "names": [ "vllm.distributed.weight_transfer.base.TInitInfo", "vllm.distributed.weight_transfer.base.TUpdateInfo", "vllm.distributed.weight_transfer.base.WeightTransferEngine", "vllm.distributed.weight_transfer.base.WeightTransferInitInfo", "vllm.distributed.weight_transfer.base.WeightTransferInitRequest", "vllm.distributed.weight_transfer.base.WeightTransferUpdateInfo", "vllm.distributed.weight_transfer.base.WeightTransferUpdateRequest" ], "n_typable": 20, "n_typed": 18, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 9, "n_classes": 5, "n_attrs": 10, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/weight_transfer/ipc_engine.py", "symbol_reports": [ { "kind": "class", "name": "vllm.distributed.weight_transfer.ipc_engine.IPCTrainerSendWeightsArgs", "methods": [ { "kind": "function", "name": "IPCTrainerSendWeightsArgs.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "IPCTrainerSendWeightsArgs.mode", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "IPCTrainerSendWeightsArgs.llm_handle", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "IPCTrainerSendWeightsArgs.url", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.weight_transfer.ipc_engine.IPCWeightTransferEngine", "methods": [ { "kind": "function", "name": "IPCWeightTransferEngine.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "IPCWeightTransferEngine.init_transfer_engine", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "IPCWeightTransferEngine.receive_weights", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "IPCWeightTransferEngine.shutdown", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "IPCWeightTransferEngine.trainer_send_weights", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "IPCWeightTransferEngine.init_info_cls", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "IPCWeightTransferEngine.update_info_cls", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 7, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.weight_transfer.ipc_engine.IPCWeightTransferInitInfo", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.weight_transfer.ipc_engine.IPCWeightTransferUpdateInfo", "methods": [ { "kind": "function", "name": "IPCWeightTransferUpdateInfo.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "IPCWeightTransferUpdateInfo.names", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "IPCWeightTransferUpdateInfo.dtype_names", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "IPCWeightTransferUpdateInfo.shapes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "IPCWeightTransferUpdateInfo.ipc_handles", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "IPCWeightTransferUpdateInfo.ipc_handles_pickled", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 5, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.distributed.weight_transfer.ipc_engine", "names": [ "vllm.distributed.weight_transfer.ipc_engine.IPCTrainerSendWeightsArgs", "vllm.distributed.weight_transfer.ipc_engine.IPCWeightTransferEngine", "vllm.distributed.weight_transfer.ipc_engine.IPCWeightTransferInitInfo", "vllm.distributed.weight_transfer.ipc_engine.IPCWeightTransferUpdateInfo" ], "n_typable": 14, "n_typed": 12, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 7, "n_classes": 4, "n_attrs": 10, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/weight_transfer/nccl_engine.py", "symbol_reports": [ { "kind": "class", "name": "vllm.distributed.weight_transfer.nccl_engine.NCCLTrainerSendWeightsArgs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "NCCLTrainerSendWeightsArgs.group", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NCCLTrainerSendWeightsArgs.src", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NCCLTrainerSendWeightsArgs.post_iter_func", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NCCLTrainerSendWeightsArgs.packed", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NCCLTrainerSendWeightsArgs.stream", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NCCLTrainerSendWeightsArgs.packed_buffer_size_bytes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NCCLTrainerSendWeightsArgs.packed_num_buffers", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.weight_transfer.nccl_engine.NCCLWeightTransferInitInfo", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "NCCLWeightTransferInitInfo.master_address", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NCCLWeightTransferInitInfo.master_port", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NCCLWeightTransferInitInfo.rank_offset", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NCCLWeightTransferInitInfo.world_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.weight_transfer.nccl_engine.NCCLWeightTransferEngine", "methods": [ { "kind": "function", "name": "NCCLWeightTransferEngine.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NCCLWeightTransferEngine.init_transfer_engine", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NCCLWeightTransferEngine.receive_weights", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NCCLWeightTransferEngine.shutdown", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NCCLWeightTransferEngine.trainer_send_weights", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NCCLWeightTransferEngine.trainer_init", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NCCLWeightTransferEngine._stateless_init_process_group", "n_typed": 0, "n_any": 0, "n_untyped": 6, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "NCCLWeightTransferEngine.init_info_cls", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NCCLWeightTransferEngine.update_info_cls", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NCCLWeightTransferEngine.model_update_group", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 21, "n_typed": 15, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 13, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.distributed.weight_transfer.nccl_engine.NCCLWeightTransferUpdateInfo", "methods": [ { "kind": "function", "name": "NCCLWeightTransferUpdateInfo.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "NCCLWeightTransferUpdateInfo.names", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NCCLWeightTransferUpdateInfo.dtype_names", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NCCLWeightTransferUpdateInfo.shapes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NCCLWeightTransferUpdateInfo.packed", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NCCLWeightTransferUpdateInfo.packed_buffer_size_bytes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NCCLWeightTransferUpdateInfo.packed_num_buffers", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.distributed.weight_transfer.nccl_engine", "names": [ "vllm.distributed.weight_transfer.nccl_engine.NCCLTrainerSendWeightsArgs", "vllm.distributed.weight_transfer.nccl_engine.NCCLWeightTransferEngine", "vllm.distributed.weight_transfer.nccl_engine.NCCLWeightTransferInitInfo", "vllm.distributed.weight_transfer.nccl_engine.NCCLWeightTransferUpdateInfo" ], "n_typable": 22, "n_typed": 15, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 13, "n_classes": 4, "n_attrs": 20, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/distributed/weight_transfer/packed_tensor.py", "symbol_reports": [ { "kind": "function", "name": "vllm.distributed.weight_transfer.packed_tensor.packed_broadcast_consumer", "n_typed": 6, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "attr", "name": "vllm.distributed.weight_transfer.packed_tensor.DEFAULT_PACKED_BUFFER_SIZE_BYTES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.distributed.weight_transfer.packed_tensor.DEFAULT_PACKED_NUM_BUFFERS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.distributed.weight_transfer.packed_tensor.packed_broadcast_producer", "n_typed": 6, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "type_ignores": [], "name": "vllm.distributed.weight_transfer.packed_tensor", "names": [ "vllm.distributed.weight_transfer.packed_tensor.DEFAULT_PACKED_BUFFER_SIZE_BYTES", "vllm.distributed.weight_transfer.packed_tensor.DEFAULT_PACKED_NUM_BUFFERS", "vllm.distributed.weight_transfer.packed_tensor.packed_broadcast_consumer", "vllm.distributed.weight_transfer.packed_tensor.packed_broadcast_producer" ], "n_typable": 14, "n_typed": 12, "n_any": 2, "n_untyped": 0, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 12, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/engine/protocol.py", "symbol_reports": [ { "kind": "class", "name": "vllm.engine.protocol.EngineClient", "methods": [ { "kind": "function", "name": "EngineClient.generate", "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "EngineClient.encode", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "EngineClient.abort", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EngineClient.is_tracing_enabled", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineClient.do_log_stats", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineClient.check_health", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineClient.start_profile", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineClient.stop_profile", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineClient.reset_mm_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineClient.reset_encoder_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineClient.reset_prefix_cache", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EngineClient.sleep", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EngineClient.wake_up", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EngineClient.is_sleeping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineClient.add_lora", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EngineClient.pause_generation", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "EngineClient.resume_generation", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineClient.is_paused", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineClient.scale_elastic_ep", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EngineClient.collective_rpc", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "EngineClient.get_supported_tasks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineClient.init_weight_transfer_engine", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EngineClient.update_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "EngineClient.is_running", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "EngineClient.is_stopped", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "EngineClient.errored", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "EngineClient.dead_error", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "EngineClient.vllm_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineClient.model_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineClient.renderer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineClient.io_processor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineClient.input_processor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 68, "n_typed": 67, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 23, "n_method_overloads": 23, "n_method_params": 36, "n_attrs": 5, "n_properties": 4 }, { "kind": "class", "name": "vllm.engine.protocol.StreamingInput", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "StreamingInput.prompt", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StreamingInput.sampling_params", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.engine.protocol", "names": [ "vllm.engine.protocol.EngineClient", "vllm.engine.protocol.StreamingInput" ], "n_typable": 68, "n_typed": 67, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 23, "n_method_overloads": 23, "n_method_params": 36, "n_classes": 2, "n_attrs": 7, "n_properties": 4, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/anthropic/api_router.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.anthropic.api_router.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.anthropic.api_router.attach_router", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.anthropic.api_router.create_messages", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.entrypoints.anthropic.api_router.translate_error_response", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.anthropic.api_router.messages", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.anthropic.api_router.count_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.entrypoints.anthropic.api_router.router", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.anthropic.api_router", "names": [ "vllm.entrypoints.anthropic.api_router.attach_router", "vllm.entrypoints.anthropic.api_router.count_tokens", "vllm.entrypoints.anthropic.api_router.create_messages", "vllm.entrypoints.anthropic.api_router.logger", "vllm.entrypoints.anthropic.api_router.messages", "vllm.entrypoints.anthropic.api_router.router", "vllm.entrypoints.anthropic.api_router.translate_error_response" ], "n_typable": 14, "n_typed": 9, "n_any": 0, "n_untyped": 5, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 7, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/anthropic/protocol.py", "symbol_reports": [ { "kind": "class", "name": "vllm.entrypoints.anthropic.protocol.AnthropicContextManagement", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "AnthropicContextManagement.original_input_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.anthropic.protocol.AnthropicMessage", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "AnthropicMessage.role", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicMessage.content", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.anthropic.protocol.AnthropicTool", "methods": [ { "kind": "function", "name": "AnthropicTool.validate_input_schema", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AnthropicTool.name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicTool.description", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicTool.input_schema", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 5, "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.anthropic.protocol.AnthropicContentBlock", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "AnthropicContentBlock.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicContentBlock.text", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicContentBlock.source", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicContentBlock.id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicContentBlock.tool_use_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicContentBlock.name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicContentBlock.input", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicContentBlock.content", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicContentBlock.is_error", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicContentBlock.thinking", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicContentBlock.signature", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 11, "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 11, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.anthropic.protocol.AnthropicErrorResponse", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "AnthropicErrorResponse.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicErrorResponse.error", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.anthropic.protocol.AnthropicDelta", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "AnthropicDelta.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicDelta.text", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicDelta.thinking", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicDelta.partial_json", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicDelta.signature", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicDelta.stop_reason", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicDelta.stop_sequence", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.anthropic.protocol.AnthropicStreamEvent", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "AnthropicStreamEvent.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicStreamEvent.message", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicStreamEvent.delta", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicStreamEvent.content_block", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicStreamEvent.index", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicStreamEvent.error", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicStreamEvent.usage", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.anthropic.protocol.AnthropicCountTokensResponse", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "AnthropicCountTokensResponse.input_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicCountTokensResponse.context_management", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.anthropic.protocol.AnthropicMessagesRequest", "methods": [ { "kind": "function", "name": "AnthropicMessagesRequest.validate_model", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AnthropicMessagesRequest.validate_max_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AnthropicMessagesRequest.model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicMessagesRequest.messages", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicMessagesRequest.max_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicMessagesRequest.metadata", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicMessagesRequest.stop_sequences", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicMessagesRequest.stream", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicMessagesRequest.system", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicMessagesRequest.temperature", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicMessagesRequest.tool_choice", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicMessagesRequest.tools", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicMessagesRequest.top_k", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicMessagesRequest.top_p", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 16, "n_typed": 12, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 12, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.anthropic.protocol.AnthropicToolChoice", "methods": [ { "kind": "function", "name": "AnthropicToolChoice.validate_name_required_for_tool", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AnthropicToolChoice.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicToolChoice.name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.anthropic.protocol.AnthropicMessagesResponse", "methods": [ { "kind": "function", "name": "AnthropicMessagesResponse.model_post_init", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AnthropicMessagesResponse.id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicMessagesResponse.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicMessagesResponse.role", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicMessagesResponse.content", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicMessagesResponse.model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicMessagesResponse.stop_reason", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicMessagesResponse.stop_sequence", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicMessagesResponse.usage", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 10, "n_typed": 8, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.anthropic.protocol.AnthropicCountTokensRequest", "methods": [ { "kind": "function", "name": "AnthropicCountTokensRequest.validate_model", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AnthropicCountTokensRequest.model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicCountTokensRequest.messages", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicCountTokensRequest.system", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicCountTokensRequest.tool_choice", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicCountTokensRequest.tools", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 7, "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.anthropic.protocol.AnthropicUsage", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "AnthropicUsage.input_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicUsage.output_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicUsage.cache_creation_input_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicUsage.cache_read_input_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.anthropic.protocol.AnthropicError", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "AnthropicError.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AnthropicError.message", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.anthropic.protocol", "names": [ "vllm.entrypoints.anthropic.protocol.AnthropicContentBlock", "vllm.entrypoints.anthropic.protocol.AnthropicContextManagement", "vllm.entrypoints.anthropic.protocol.AnthropicCountTokensRequest", "vllm.entrypoints.anthropic.protocol.AnthropicCountTokensResponse", "vllm.entrypoints.anthropic.protocol.AnthropicDelta", "vllm.entrypoints.anthropic.protocol.AnthropicError", "vllm.entrypoints.anthropic.protocol.AnthropicErrorResponse", "vllm.entrypoints.anthropic.protocol.AnthropicMessage", "vllm.entrypoints.anthropic.protocol.AnthropicMessagesRequest", "vllm.entrypoints.anthropic.protocol.AnthropicMessagesResponse", "vllm.entrypoints.anthropic.protocol.AnthropicStreamEvent", "vllm.entrypoints.anthropic.protocol.AnthropicTool", "vllm.entrypoints.anthropic.protocol.AnthropicToolChoice", "vllm.entrypoints.anthropic.protocol.AnthropicUsage" ], "n_typable": 79, "n_typed": 69, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 5, "n_classes": 14, "n_attrs": 68, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/anthropic/serving.py", "symbol_reports": [ { "kind": "function", "name": "vllm.entrypoints.anthropic.serving.wrap_data_with_event", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.entrypoints.anthropic.serving.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.entrypoints.anthropic.serving.AnthropicServingMessages", "methods": [ { "kind": "function", "name": "AnthropicServingMessages.__init__", "n_typed": 12, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 }, { "kind": "function", "name": "AnthropicServingMessages._convert_image_source_to_url", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AnthropicServingMessages._convert_anthropic_to_openai_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AnthropicServingMessages._convert_system_message", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AnthropicServingMessages._convert_messages", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AnthropicServingMessages._convert_message_content", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "AnthropicServingMessages._convert_block", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "AnthropicServingMessages._convert_tool_use_block", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AnthropicServingMessages._convert_tool_result_block", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "AnthropicServingMessages._convert_user_tool_result", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AnthropicServingMessages._build_base_request", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AnthropicServingMessages._handle_streaming_options", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AnthropicServingMessages._convert_tool_choice", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AnthropicServingMessages._convert_tools", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AnthropicServingMessages.create_messages", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AnthropicServingMessages.messages_full_converter", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AnthropicServingMessages.message_stream_converter", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AnthropicServingMessages.count_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AnthropicServingMessages.stop_reason_map", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 68, "n_typed": 61, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 18, "n_method_overloads": 18, "n_method_params": 49, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.anthropic.serving", "names": [ "vllm.entrypoints.anthropic.serving.AnthropicServingMessages", "vllm.entrypoints.anthropic.serving.logger", "vllm.entrypoints.anthropic.serving.wrap_data_with_event" ], "n_typable": 72, "n_typed": 63, "n_any": 0, "n_untyped": 9, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 18, "n_method_overloads": 18, "n_method_params": 49, "n_classes": 1, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/api_server.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.api_server.app", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.entrypoints.api_server.parser", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.api_server.health", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.entrypoints.api_server.args", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.api_server.init_app", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.entrypoints.api_server.build_app", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.entrypoints.api_server.engine", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.entrypoints.api_server.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.api_server.run_server", "n_typed": 3, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.entrypoints.api_server.generate", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.api_server", "names": [ "vllm.entrypoints.api_server.app", "vllm.entrypoints.api_server.args", "vllm.entrypoints.api_server.build_app", "vllm.entrypoints.api_server.engine", "vllm.entrypoints.api_server.generate", "vllm.entrypoints.api_server.health", "vllm.entrypoints.api_server.init_app", "vllm.entrypoints.api_server.logger", "vllm.entrypoints.api_server.parser", "vllm.entrypoints.api_server.run_server" ], "n_typable": 16, "n_typed": 11, "n_any": 1, "n_untyped": 4, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 7, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 5, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/chat_utils.py", "symbol_reports": [ { "kind": "class", "name": "vllm.entrypoints.chat_utils.CustomChatCompletionContentSimpleAudioParam", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "CustomChatCompletionContentSimpleAudioParam.audio_url", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.chat_utils.AudioURL", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "AudioURL.url", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.chat_utils.BaseMultiModalItemTracker", "methods": [ { "kind": "function", "name": "BaseMultiModalItemTracker.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseMultiModalItemTracker.add", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseMultiModalItemTracker.create_parser", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "BaseMultiModalItemTracker.use_unified_vision_chunk_modality", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "BaseMultiModalItemTracker.model_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "BaseMultiModalItemTracker.model_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "BaseMultiModalItemTracker.allowed_local_media_path", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "BaseMultiModalItemTracker.allowed_media_domains", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "BaseMultiModalItemTracker.mm_registry", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "BaseMultiModalItemTracker.mm_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [], "n_typable": 13, "n_typed": 8, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_attrs": 0, "n_properties": 7 }, { "kind": "class", "name": "vllm.entrypoints.chat_utils.CustomThinkCompletionContentParam", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "CustomThinkCompletionContentParam.thinking", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CustomThinkCompletionContentParam.closed", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CustomThinkCompletionContentParam.type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.entrypoints.chat_utils.MODALITY_PLACEHOLDERS_MAP", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.entrypoints.chat_utils.MM_PARSER_MAP", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.entrypoints.chat_utils.AsyncMultiModalItemTracker", "methods": [ { "kind": "function", "name": "AsyncMultiModalItemTracker.resolve_items", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AsyncMultiModalItemTracker.create_parser", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.entrypoints.chat_utils.parse_chat_messages", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.entrypoints.chat_utils.load_chat_template", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.entrypoints.chat_utils.ModalityStr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.entrypoints.chat_utils.MultiModalContentParser", "methods": [ { "kind": "function", "name": "MultiModalContentParser.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiModalContentParser.parse_image", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MultiModalContentParser.parse_image_embeds", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MultiModalContentParser.parse_audio_embeds", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MultiModalContentParser.parse_image_pil", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MultiModalContentParser.parse_audio", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MultiModalContentParser.parse_input_audio", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MultiModalContentParser.parse_video", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [ { "kind": "property", "name": "MultiModalContentParser.model_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [], "n_typable": 24, "n_typed": 24, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 15, "n_attrs": 0, "n_properties": 1 }, { "kind": "attr", "name": "vllm.entrypoints.chat_utils.ChatCompletionContentPartParam", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.entrypoints.chat_utils.ChatTemplateContentFormatOption", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.chat_utils.parse_chat_messages_async", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.entrypoints.chat_utils.ChatCompletionContentPartImageEmbedsParam", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ChatCompletionContentPartImageEmbedsParam.image_embeds", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ChatCompletionContentPartImageEmbedsParam.type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ChatCompletionContentPartImageEmbedsParam.uuid", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.chat_utils.CustomChatCompletionContentSimpleVideoParam", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "CustomChatCompletionContentSimpleVideoParam.video_url", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CustomChatCompletionContentSimpleVideoParam.uuid", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.chat_utils.PILImage", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "PILImage.image_pil", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PILImage.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 2, "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.chat_utils.AsyncMultiModalContentParser", "methods": [ { "kind": "function", "name": "AsyncMultiModalContentParser.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AsyncMultiModalContentParser._image_with_uuid_async", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AsyncMultiModalContentParser.parse_image", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AsyncMultiModalContentParser.parse_image_embeds", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AsyncMultiModalContentParser.parse_audio_embeds", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AsyncMultiModalContentParser.parse_image_pil", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AsyncMultiModalContentParser._audio_with_uuid_async", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AsyncMultiModalContentParser.parse_audio", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AsyncMultiModalContentParser.parse_input_audio", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AsyncMultiModalContentParser._video_with_uuid_async", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AsyncMultiModalContentParser.parse_video", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [ { "kind": "property", "name": "AsyncMultiModalContentParser.model_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [], "n_typable": 33, "n_typed": 30, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 21, "n_attrs": 0, "n_properties": 1 }, { "kind": "class", "name": "vllm.entrypoints.chat_utils.ChatCompletionContentPartVideoParam", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ChatCompletionContentPartVideoParam.video_url", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ChatCompletionContentPartVideoParam.type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.chat_utils.CustomChatCompletionMessageParam", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "CustomChatCompletionMessageParam.role", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CustomChatCompletionMessageParam.content", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CustomChatCompletionMessageParam.name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CustomChatCompletionMessageParam.tool_call_id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CustomChatCompletionMessageParam.tool_calls", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CustomChatCompletionMessageParam.reasoning", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CustomChatCompletionMessageParam.tools", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 7, "n_properties": 0 }, { "kind": "attr", "name": "vllm.entrypoints.chat_utils.ChatTemplateContentFormat", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.chat_utils.validate_chat_template", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.entrypoints.chat_utils.torch", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.entrypoints.chat_utils.VideoURL", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "VideoURL.url", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.entrypoints.chat_utils.make_tool_call_id", "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.entrypoints.chat_utils.ConversationMessage", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ConversationMessage.role", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ConversationMessage.content", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ConversationMessage.tool_call_id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ConversationMessage.name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ConversationMessage.tool_calls", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ConversationMessage.reasoning", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ConversationMessage.reasoning_content", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ConversationMessage.tools", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.chat_utils.CustomChatCompletionContentSimpleImageParam", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "CustomChatCompletionContentSimpleImageParam.image_url", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CustomChatCompletionContentSimpleImageParam.uuid", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.entrypoints.chat_utils.ChatCompletionMessageParam", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.entrypoints.chat_utils.ChatCompletionContentPartAudioEmbedsParam", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ChatCompletionContentPartAudioEmbedsParam.audio_embeds", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ChatCompletionContentPartAudioEmbedsParam.type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ChatCompletionContentPartAudioEmbedsParam.uuid", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.chat_utils.CustomChatCompletionContentPILImageParam", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "CustomChatCompletionContentPILImageParam.image_pil", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CustomChatCompletionContentPILImageParam.uuid", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.chat_utils.BaseMultiModalContentParser", "methods": [ { "kind": "function", "name": "BaseMultiModalContentParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BaseMultiModalContentParser._add_placeholder", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseMultiModalContentParser.mm_placeholder_storage", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BaseMultiModalContentParser.parse_image", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseMultiModalContentParser.parse_image_embeds", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseMultiModalContentParser.parse_image_pil", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseMultiModalContentParser.parse_audio", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseMultiModalContentParser.parse_input_audio", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseMultiModalContentParser.parse_audio_embeds", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseMultiModalContentParser.parse_video", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 26, "n_typed": 25, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 16, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.entrypoints.chat_utils.PART_TYPES_TO_SKIP_NONE_CONTENT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.entrypoints.chat_utils.ChatTemplateResolutionError", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.entrypoints.chat_utils.get_history_tool_calls_cnt", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.entrypoints.chat_utils.ChatTemplateConfig", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ChatTemplateConfig.chat_template", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ChatTemplateConfig.chat_template_content_format", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ChatTemplateConfig.trust_request_chat_template", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.entrypoints.chat_utils.transformers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.entrypoints.chat_utils.ChatCompletionContentPartAudioParam", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ChatCompletionContentPartAudioParam.audio_url", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ChatCompletionContentPartAudioParam.type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.entrypoints.chat_utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.entrypoints.chat_utils.MultiModalItemTracker", "methods": [ { "kind": "function", "name": "MultiModalItemTracker.resolve_items", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MultiModalItemTracker.create_parser", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.chat_utils", "names": [ "vllm.entrypoints.chat_utils.AsyncMultiModalContentParser", "vllm.entrypoints.chat_utils.AsyncMultiModalItemTracker", "vllm.entrypoints.chat_utils.AudioURL", "vllm.entrypoints.chat_utils.BaseMultiModalContentParser", "vllm.entrypoints.chat_utils.BaseMultiModalItemTracker", "vllm.entrypoints.chat_utils.ChatCompletionContentPartAudioEmbedsParam", "vllm.entrypoints.chat_utils.ChatCompletionContentPartAudioParam", "vllm.entrypoints.chat_utils.ChatCompletionContentPartImageEmbedsParam", "vllm.entrypoints.chat_utils.ChatCompletionContentPartParam", "vllm.entrypoints.chat_utils.ChatCompletionContentPartVideoParam", "vllm.entrypoints.chat_utils.ChatCompletionMessageParam", "vllm.entrypoints.chat_utils.ChatTemplateConfig", "vllm.entrypoints.chat_utils.ChatTemplateContentFormat", "vllm.entrypoints.chat_utils.ChatTemplateContentFormatOption", "vllm.entrypoints.chat_utils.ChatTemplateResolutionError", "vllm.entrypoints.chat_utils.ConversationMessage", "vllm.entrypoints.chat_utils.CustomChatCompletionContentPILImageParam", "vllm.entrypoints.chat_utils.CustomChatCompletionContentSimpleAudioParam", "vllm.entrypoints.chat_utils.CustomChatCompletionContentSimpleImageParam", "vllm.entrypoints.chat_utils.CustomChatCompletionContentSimpleVideoParam", "vllm.entrypoints.chat_utils.CustomChatCompletionMessageParam", "vllm.entrypoints.chat_utils.CustomThinkCompletionContentParam", "vllm.entrypoints.chat_utils.MM_PARSER_MAP", "vllm.entrypoints.chat_utils.MODALITY_PLACEHOLDERS_MAP", "vllm.entrypoints.chat_utils.ModalityStr", "vllm.entrypoints.chat_utils.MultiModalContentParser", "vllm.entrypoints.chat_utils.MultiModalItemTracker", "vllm.entrypoints.chat_utils.PART_TYPES_TO_SKIP_NONE_CONTENT", "vllm.entrypoints.chat_utils.PILImage", "vllm.entrypoints.chat_utils.VideoURL", "vllm.entrypoints.chat_utils.get_history_tool_calls_cnt", "vllm.entrypoints.chat_utils.load_chat_template", "vllm.entrypoints.chat_utils.logger", "vllm.entrypoints.chat_utils.make_tool_call_id", "vllm.entrypoints.chat_utils.parse_chat_messages", "vllm.entrypoints.chat_utils.parse_chat_messages_async", "vllm.entrypoints.chat_utils.torch", "vllm.entrypoints.chat_utils.transformers", "vllm.entrypoints.chat_utils.validate_chat_template" ], "n_typable": 130, "n_typed": 112, "n_any": 0, "n_untyped": 18, "n_functions": 6, "n_function_overloads": 6, "n_function_params": 13, "n_methods": 36, "n_method_overloads": 36, "n_method_params": 55, "n_classes": 22, "n_attrs": 53, "n_properties": 9, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/cli/benchmark/throughput.py", "symbol_reports": [ { "kind": "class", "name": "vllm.entrypoints.cli.benchmark.throughput.BenchmarkThroughputSubcommand", "methods": [ { "kind": "function", "name": "BenchmarkThroughputSubcommand.add_cli_args", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BenchmarkThroughputSubcommand.cmd", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BenchmarkThroughputSubcommand.name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BenchmarkThroughputSubcommand.help", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.cli.benchmark.throughput", "names": [ "vllm.entrypoints.cli.benchmark.throughput.BenchmarkThroughputSubcommand" ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_classes": 1, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/cli/benchmark/mm_processor.py", "symbol_reports": [ { "kind": "class", "name": "vllm.entrypoints.cli.benchmark.mm_processor.BenchmarkMMProcessorSubcommand", "methods": [ { "kind": "function", "name": "BenchmarkMMProcessorSubcommand.add_cli_args", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BenchmarkMMProcessorSubcommand.cmd", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BenchmarkMMProcessorSubcommand.name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BenchmarkMMProcessorSubcommand.help", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.cli.benchmark.mm_processor", "names": [ "vllm.entrypoints.cli.benchmark.mm_processor.BenchmarkMMProcessorSubcommand" ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_classes": 1, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/cli/benchmark/startup.py", "symbol_reports": [ { "kind": "class", "name": "vllm.entrypoints.cli.benchmark.startup.BenchmarkStartupSubcommand", "methods": [ { "kind": "function", "name": "BenchmarkStartupSubcommand.add_cli_args", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BenchmarkStartupSubcommand.cmd", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BenchmarkStartupSubcommand.name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BenchmarkStartupSubcommand.help", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.cli.benchmark.startup", "names": [ "vllm.entrypoints.cli.benchmark.startup.BenchmarkStartupSubcommand" ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_classes": 1, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/cli/benchmark/latency.py", "symbol_reports": [ { "kind": "class", "name": "vllm.entrypoints.cli.benchmark.latency.BenchmarkLatencySubcommand", "methods": [ { "kind": "function", "name": "BenchmarkLatencySubcommand.add_cli_args", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BenchmarkLatencySubcommand.cmd", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BenchmarkLatencySubcommand.name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BenchmarkLatencySubcommand.help", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.cli.benchmark.latency", "names": [ "vllm.entrypoints.cli.benchmark.latency.BenchmarkLatencySubcommand" ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_classes": 1, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/cli/benchmark/serve.py", "symbol_reports": [ { "kind": "class", "name": "vllm.entrypoints.cli.benchmark.serve.BenchmarkServingSubcommand", "methods": [ { "kind": "function", "name": "BenchmarkServingSubcommand.add_cli_args", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BenchmarkServingSubcommand.cmd", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BenchmarkServingSubcommand.name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BenchmarkServingSubcommand.help", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.cli.benchmark.serve", "names": [ "vllm.entrypoints.cli.benchmark.serve.BenchmarkServingSubcommand" ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_classes": 1, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/cli/benchmark/sweep.py", "symbol_reports": [ { "kind": "class", "name": "vllm.entrypoints.cli.benchmark.sweep.BenchmarkSweepSubcommand", "methods": [ { "kind": "function", "name": "BenchmarkSweepSubcommand.add_cli_args", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BenchmarkSweepSubcommand.cmd", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BenchmarkSweepSubcommand.name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BenchmarkSweepSubcommand.help", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.cli.benchmark.sweep", "names": [ "vllm.entrypoints.cli.benchmark.sweep.BenchmarkSweepSubcommand" ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_classes": 1, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/cli/benchmark/base.py", "symbol_reports": [ { "kind": "class", "name": "vllm.entrypoints.cli.benchmark.base.BenchmarkSubcommandBase", "methods": [ { "kind": "function", "name": "BenchmarkSubcommandBase.add_cli_args", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BenchmarkSubcommandBase.cmd", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BenchmarkSubcommandBase.help", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.cli.benchmark.base", "names": [ "vllm.entrypoints.cli.benchmark.base.BenchmarkSubcommandBase" ], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/cli/benchmark/main.py", "symbol_reports": [ { "kind": "class", "name": "vllm.entrypoints.cli.benchmark.main.BenchmarkSubcommand", "methods": [ { "kind": "function", "name": "BenchmarkSubcommand.cmd", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BenchmarkSubcommand.validate", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BenchmarkSubcommand.subparser_init", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BenchmarkSubcommand.name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BenchmarkSubcommand.help", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_attrs": 2, "n_properties": 0 }, { "kind": "function", "name": "vllm.entrypoints.cli.benchmark.main.cmd_init", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.cli.benchmark.main", "names": [ "vllm.entrypoints.cli.benchmark.main.BenchmarkSubcommand", "vllm.entrypoints.cli.benchmark.main.cmd_init" ], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_classes": 1, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/cli/collect_env.py", "symbol_reports": [ { "kind": "class", "name": "vllm.entrypoints.cli.collect_env.CollectEnvSubcommand", "methods": [ { "kind": "function", "name": "CollectEnvSubcommand.cmd", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CollectEnvSubcommand.subparser_init", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CollectEnvSubcommand.name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.entrypoints.cli.collect_env.cmd_init", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.cli.collect_env", "names": [ "vllm.entrypoints.cli.collect_env.CollectEnvSubcommand", "vllm.entrypoints.cli.collect_env.cmd_init" ], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/cli/main.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.cli.main.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.cli.main.main", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.cli.main", "names": [ "vllm.entrypoints.cli.main.logger", "vllm.entrypoints.cli.main.main" ], "n_typable": 2, "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/cli/openai.py", "symbol_reports": [ { "kind": "function", "name": "vllm.entrypoints.cli.openai.chat", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.entrypoints.cli.openai.CompleteCommand", "methods": [ { "kind": "function", "name": "CompleteCommand.cmd", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompleteCommand.add_cli_args", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompleteCommand.subparser_init", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CompleteCommand.name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.entrypoints.cli.openai.cmd_init", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "class", "name": "vllm.entrypoints.cli.openai.ChatCommand", "methods": [ { "kind": "function", "name": "ChatCommand.cmd", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ChatCommand.add_cli_args", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ChatCommand.subparser_init", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ChatCommand.name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.cli.openai", "names": [ "vllm.entrypoints.cli.openai.ChatCommand", "vllm.entrypoints.cli.openai.CompleteCommand", "vllm.entrypoints.cli.openai.chat", "vllm.entrypoints.cli.openai.cmd_init" ], "n_typable": 17, "n_typed": 17, "n_any": 0, "n_untyped": 0, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 3, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 6, "n_classes": 2, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/cli/run_batch.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.cli.run_batch.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.cli.run_batch.cmd_init", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "class", "name": "vllm.entrypoints.cli.run_batch.RunBatchSubcommand", "methods": [ { "kind": "function", "name": "RunBatchSubcommand.cmd", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RunBatchSubcommand.subparser_init", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RunBatchSubcommand.name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.cli.run_batch", "names": [ "vllm.entrypoints.cli.run_batch.RunBatchSubcommand", "vllm.entrypoints.cli.run_batch.cmd_init", "vllm.entrypoints.cli.run_batch.logger" ], "n_typable": 6, "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_classes": 1, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/cli/serve.py", "symbol_reports": [ { "kind": "class", "name": "vllm.entrypoints.cli.serve.ServeSubcommand", "methods": [ { "kind": "function", "name": "ServeSubcommand.cmd", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ServeSubcommand.validate", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ServeSubcommand.subparser_init", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ServeSubcommand.name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.entrypoints.cli.serve.run_multi_api_server", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.entrypoints.cli.serve.DESCRIPTION", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.entrypoints.cli.serve.run_headless", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.cli.serve.run_api_server_worker_proc", "n_typed": 1, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "attr", "name": "vllm.entrypoints.cli.serve.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.cli.serve.cmd_init", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.cli.serve", "names": [ "vllm.entrypoints.cli.serve.DESCRIPTION", "vllm.entrypoints.cli.serve.ServeSubcommand", "vllm.entrypoints.cli.serve.cmd_init", "vllm.entrypoints.cli.serve.logger", "vllm.entrypoints.cli.serve.run_api_server_worker_proc", "vllm.entrypoints.cli.serve.run_headless", "vllm.entrypoints.cli.serve.run_multi_api_server" ], "n_typable": 18, "n_typed": 10, "n_any": 0, "n_untyped": 8, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 7, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_classes": 1, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/cli/types.py", "symbol_reports": [ { "kind": "class", "name": "vllm.entrypoints.cli.types.CLISubcommand", "methods": [ { "kind": "function", "name": "CLISubcommand.cmd", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CLISubcommand.validate", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CLISubcommand.subparser_init", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CLISubcommand.name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.cli.types", "names": [ "vllm.entrypoints.cli.types.CLISubcommand" ], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/constants.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.constants.H11_MAX_INCOMPLETE_EVENT_SIZE_DEFAULT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.entrypoints.constants.H11_MAX_HEADER_COUNT_DEFAULT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.entrypoints.constants.MCP_PREFIX", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.constants", "names": [ "vllm.entrypoints.constants.H11_MAX_HEADER_COUNT_DEFAULT", "vllm.entrypoints.constants.H11_MAX_INCOMPLETE_EVENT_SIZE_DEFAULT", "vllm.entrypoints.constants.MCP_PREFIX" ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/grpc_server.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.grpc_server.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.entrypoints.grpc_server.VllmEngineServicer", "methods": [ { "kind": "function", "name": "VllmEngineServicer.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VllmEngineServicer.Generate", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VllmEngineServicer.Embed", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VllmEngineServicer.HealthCheck", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VllmEngineServicer.Abort", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VllmEngineServicer.GetModelInfo", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VllmEngineServicer.GetServerInfo", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VllmEngineServicer._sampling_params_from_proto", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VllmEngineServicer._tokenization_kwargs_from_proto", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "VllmEngineServicer._chunk_response", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "VllmEngineServicer._complete_response", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "VllmEngineServicer.async_llm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VllmEngineServicer.start_time", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 32, "n_typed": 29, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 19, "n_attrs": 2, "n_properties": 0 }, { "kind": "function", "name": "vllm.entrypoints.grpc_server.main", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.entrypoints.grpc_server.serve_grpc", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.grpc_server", "names": [ "vllm.entrypoints.grpc_server.VllmEngineServicer", "vllm.entrypoints.grpc_server.logger", "vllm.entrypoints.grpc_server.main", "vllm.entrypoints.grpc_server.serve_grpc" ], "n_typable": 36, "n_typed": 30, "n_any": 0, "n_untyped": 6, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 1, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 19, "n_classes": 1, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/launcher.py", "symbol_reports": [ { "kind": "function", "name": "vllm.entrypoints.launcher.serve_http", "n_typed": 3, "n_any": 1, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "attr", "name": "vllm.entrypoints.launcher.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.launcher.watchdog_loop", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.entrypoints.launcher.terminate_if_errored", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.entrypoints.launcher", "names": [ "vllm.entrypoints.launcher.logger", "vllm.entrypoints.launcher.serve_http", "vllm.entrypoints.launcher.terminate_if_errored", "vllm.entrypoints.launcher.watchdog_loop" ], "n_typable": 12, "n_typed": 7, "n_any": 1, "n_untyped": 4, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 8, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/logger.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.logger.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.entrypoints.logger.RequestLogger", "methods": [ { "kind": "function", "name": "RequestLogger.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RequestLogger.log_inputs", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "RequestLogger.log_outputs", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RequestLogger.max_log_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 16, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 13, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.logger", "names": [ "vllm.entrypoints.logger.RequestLogger", "vllm.entrypoints.logger.logger" ], "n_typable": 18, "n_typed": 16, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 13, "n_classes": 1, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/mcp/tool.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.mcp.tool.MIN_GPT_OSS_VERSION", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.entrypoints.mcp.tool.HarmonyPythonTool", "methods": [ { "kind": "function", "name": "HarmonyPythonTool.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "HarmonyPythonTool.validate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "HarmonyPythonTool.get_result", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HarmonyPythonTool.get_result_parsable_context", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "HarmonyPythonTool.tool_config", "n_typed": 0, "n_any": 1, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "HarmonyPythonTool.enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HarmonyPythonTool.python_tool", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 2, "n_any": 3, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 2, "n_attrs": 2, "n_properties": 1 }, { "kind": "class", "name": "vllm.entrypoints.mcp.tool.HarmonyBrowserTool", "methods": [ { "kind": "function", "name": "HarmonyBrowserTool.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "HarmonyBrowserTool.get_result", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HarmonyBrowserTool.get_result_parsable_context", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "HarmonyBrowserTool.tool_config", "n_typed": 0, "n_any": 1, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "HarmonyBrowserTool.enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HarmonyBrowserTool.browser_tool", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 2, "n_any": 3, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 2, "n_attrs": 2, "n_properties": 1 }, { "kind": "function", "name": "vllm.entrypoints.mcp.tool.validate_gpt_oss_install", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "class", "name": "vllm.entrypoints.mcp.tool.Tool", "methods": [ { "kind": "function", "name": "Tool.get_result", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Tool.get_result_parsable_context", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 2, "n_any": 2, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.entrypoints.mcp.tool.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.mcp.tool", "names": [ "vllm.entrypoints.mcp.tool.HarmonyBrowserTool", "vllm.entrypoints.mcp.tool.HarmonyPythonTool", "vllm.entrypoints.mcp.tool.MIN_GPT_OSS_VERSION", "vllm.entrypoints.mcp.tool.Tool", "vllm.entrypoints.mcp.tool.logger", "vllm.entrypoints.mcp.tool.validate_gpt_oss_install" ], "n_typable": 23, "n_typed": 6, "n_any": 8, "n_untyped": 9, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 6, "n_classes": 3, "n_attrs": 6, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/mcp/tool_server.py", "symbol_reports": [ { "kind": "function", "name": "vllm.entrypoints.mcp.tool_server.list_server_and_tools", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.mcp.tool_server.post_process_tools_description", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.mcp.tool_server.trim_schema", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.entrypoints.mcp.tool_server.DemoToolServer", "methods": [ { "kind": "function", "name": "DemoToolServer.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DemoToolServer.init_and_validate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DemoToolServer.has_tool", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DemoToolServer.get_tool_description", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DemoToolServer.new_session", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DemoToolServer.tools", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 12, "n_typed": 9, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 6, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.mcp.tool_server.MCPToolServer", "methods": [ { "kind": "function", "name": "MCPToolServer.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MCPToolServer.add_tool_server", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MCPToolServer.has_tool", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MCPToolServer.get_tool_description", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MCPToolServer.new_session", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MCPToolServer.harmony_tool_descriptions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 8, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 7, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.entrypoints.mcp.tool_server.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.entrypoints.mcp.tool_server.ToolServer", "methods": [ { "kind": "function", "name": "ToolServer.has_tool", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ToolServer.get_tool_description", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ToolServer.new_session", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.mcp.tool_server", "names": [ "vllm.entrypoints.mcp.tool_server.DemoToolServer", "vllm.entrypoints.mcp.tool_server.MCPToolServer", "vllm.entrypoints.mcp.tool_server.ToolServer", "vllm.entrypoints.mcp.tool_server.list_server_and_tools", "vllm.entrypoints.mcp.tool_server.logger", "vllm.entrypoints.mcp.tool_server.post_process_tools_description", "vllm.entrypoints.mcp.tool_server.trim_schema" ], "n_typable": 41, "n_typed": 31, "n_any": 0, "n_untyped": 10, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 3, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 19, "n_classes": 3, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/openai/api_server.py", "symbol_reports": [ { "kind": "function", "name": "vllm.entrypoints.openai.api_server.build_async_engine_client_from_engine_args", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.entrypoints.openai.api_server.build_async_engine_client", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "attr", "name": "vllm.entrypoints.openai.api_server.parser", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.api_server.validate_api_server_args", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.api_server.setup_server", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.api_server.create_server_unix_socket", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.api_server.init_app_state", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "attr", "name": "vllm.entrypoints.openai.api_server.args", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.entrypoints.openai.api_server.prometheus_multiproc_dir", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.api_server.run_server_worker", "n_typed": 1, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.entrypoints.openai.api_server.build_app", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.entrypoints.openai.api_server.create_server_socket", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.entrypoints.openai.api_server.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.api_server.run_server", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.entrypoints.openai.api_server", "names": [ "vllm.entrypoints.openai.api_server.args", "vllm.entrypoints.openai.api_server.build_app", "vllm.entrypoints.openai.api_server.build_async_engine_client", "vllm.entrypoints.openai.api_server.build_async_engine_client_from_engine_args", "vllm.entrypoints.openai.api_server.create_server_socket", "vllm.entrypoints.openai.api_server.create_server_unix_socket", "vllm.entrypoints.openai.api_server.init_app_state", "vllm.entrypoints.openai.api_server.logger", "vllm.entrypoints.openai.api_server.parser", "vllm.entrypoints.openai.api_server.prometheus_multiproc_dir", "vllm.entrypoints.openai.api_server.run_server", "vllm.entrypoints.openai.api_server.run_server_worker", "vllm.entrypoints.openai.api_server.setup_server", "vllm.entrypoints.openai.api_server.validate_api_server_args" ], "n_typable": 39, "n_typed": 25, "n_any": 0, "n_untyped": 14, "n_functions": 10, "n_function_overloads": 10, "n_function_params": 25, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/openai/chat_completion/api_router.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.openai.chat_completion.api_router.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.chat_completion.api_router.chat", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.chat_completion.api_router.render_chat_completion", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.entrypoints.openai.chat_completion.api_router.create_chat_completion", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.entrypoints.openai.chat_completion.api_router.attach_router", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.entrypoints.openai.chat_completion.api_router.ENDPOINT_LOAD_METRICS_FORMAT_HEADER_LABEL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.entrypoints.openai.chat_completion.api_router.router", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.openai.chat_completion.api_router", "names": [ "vllm.entrypoints.openai.chat_completion.api_router.ENDPOINT_LOAD_METRICS_FORMAT_HEADER_LABEL", "vllm.entrypoints.openai.chat_completion.api_router.attach_router", "vllm.entrypoints.openai.chat_completion.api_router.chat", "vllm.entrypoints.openai.chat_completion.api_router.create_chat_completion", "vllm.entrypoints.openai.chat_completion.api_router.logger", "vllm.entrypoints.openai.chat_completion.api_router.render_chat_completion", "vllm.entrypoints.openai.chat_completion.api_router.router" ], "n_typable": 12, "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 6, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/openai/chat_completion/protocol.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.openai.chat_completion.protocol.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.entrypoints.openai.chat_completion.protocol.ChatCompletionToolsParam", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ChatCompletionToolsParam.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionToolsParam.function", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.chat_completion.protocol.ChatCompletionResponse", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ChatCompletionResponse.id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionResponse.object", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionResponse.created", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionResponse.model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionResponse.choices", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionResponse.service_tier", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionResponse.system_fingerprint", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionResponse.usage", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionResponse.prompt_logprobs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionResponse.prompt_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionResponse.kv_transfer_params", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 11, "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 11, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.chat_completion.protocol.ChatCompletionNamedToolChoiceParam", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ChatCompletionNamedToolChoiceParam.function", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionNamedToolChoiceParam.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.chat_completion.protocol.ChatMessage", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ChatMessage.role", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatMessage.content", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatMessage.refusal", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatMessage.annotations", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatMessage.audio", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatMessage.function_call", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatMessage.tool_calls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatMessage.reasoning", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 8, "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.chat_completion.protocol.ChatCompletionLogProbs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ChatCompletionLogProbs.content", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.chat_completion.protocol.ChatCompletionNamedFunction", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ChatCompletionNamedFunction.name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.chat_completion.protocol.ChatCompletionResponseChoice", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ChatCompletionResponseChoice.index", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionResponseChoice.message", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionResponseChoice.logprobs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionResponseChoice.finish_reason", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionResponseChoice.stop_reason", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionResponseChoice.token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.chat_completion.protocol.ChatCompletionRequest", "methods": [ { "kind": "function", "name": "ChatCompletionRequest.build_chat_params", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ChatCompletionRequest.build_tok_params", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ChatCompletionRequest.to_beam_search_params", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ChatCompletionRequest.to_sampling_params", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ChatCompletionRequest.validate_response_format", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ChatCompletionRequest.validate_stream_options", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ChatCompletionRequest.check_logprobs", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ChatCompletionRequest.check_structured_outputs_count", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ChatCompletionRequest.check_tool_usage", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ChatCompletionRequest.check_generation_prompt", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ChatCompletionRequest.check_cache_salt_support", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ChatCompletionRequest.check_system_message_content_type", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ChatCompletionRequest.messages", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.frequency_penalty", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.logit_bias", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.logprobs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.top_logprobs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.max_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.max_completion_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.n", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.presence_penalty", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.response_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.seed", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.stop", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.stream", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.stream_options", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.temperature", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.top_p", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.tools", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.tool_choice", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.reasoning_effort", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.include_reasoning", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.parallel_tool_calls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.user", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.use_beam_search", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.top_k", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.min_p", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.repetition_penalty", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.length_penalty", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.stop_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.include_stop_str_in_output", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.ignore_eos", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.min_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.skip_special_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.spaces_between_special_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.truncate_prompt_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.prompt_logprobs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.allowed_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.bad_words", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.echo", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.add_generation_prompt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.continue_final_message", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.add_special_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.documents", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.chat_template", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.chat_template_kwargs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.mm_processor_kwargs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.structured_outputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.priority", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.request_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.return_tokens_as_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.return_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.cache_salt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.kv_transfer_params", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.vllm_xargs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest.repetition_detection", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionRequest._DEFAULT_SAMPLING_PARAMS", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 83, "n_typed": 67, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 15, "n_attrs": 56, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.chat_completion.protocol.ChatCompletionStreamResponse", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ChatCompletionStreamResponse.id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionStreamResponse.object", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionStreamResponse.created", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionStreamResponse.model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionStreamResponse.choices", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionStreamResponse.usage", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionStreamResponse.prompt_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.chat_completion.protocol.ChatCompletionLogProb", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ChatCompletionLogProb.token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionLogProb.logprob", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionLogProb.bytes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.chat_completion.protocol.ChatCompletionLogProbsContent", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ChatCompletionLogProbsContent.field_names", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionLogProbsContent.top_logprobs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.chat_completion.protocol.ChatCompletionResponseStreamChoice", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ChatCompletionResponseStreamChoice.index", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionResponseStreamChoice.delta", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionResponseStreamChoice.logprobs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionResponseStreamChoice.finish_reason", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionResponseStreamChoice.stop_reason", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatCompletionResponseStreamChoice.token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.openai.chat_completion.protocol", "names": [ "vllm.entrypoints.openai.chat_completion.protocol.ChatCompletionLogProb", "vllm.entrypoints.openai.chat_completion.protocol.ChatCompletionLogProbs", "vllm.entrypoints.openai.chat_completion.protocol.ChatCompletionLogProbsContent", "vllm.entrypoints.openai.chat_completion.protocol.ChatCompletionNamedFunction", "vllm.entrypoints.openai.chat_completion.protocol.ChatCompletionNamedToolChoiceParam", "vllm.entrypoints.openai.chat_completion.protocol.ChatCompletionRequest", "vllm.entrypoints.openai.chat_completion.protocol.ChatCompletionResponse", "vllm.entrypoints.openai.chat_completion.protocol.ChatCompletionResponseChoice", "vllm.entrypoints.openai.chat_completion.protocol.ChatCompletionResponseStreamChoice", "vllm.entrypoints.openai.chat_completion.protocol.ChatCompletionStreamResponse", "vllm.entrypoints.openai.chat_completion.protocol.ChatCompletionToolsParam", "vllm.entrypoints.openai.chat_completion.protocol.ChatMessage", "vllm.entrypoints.openai.chat_completion.protocol.logger" ], "n_typable": 133, "n_typed": 116, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 15, "n_classes": 12, "n_attrs": 106, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/openai/chat_completion/serving.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.openai.chat_completion.serving.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.entrypoints.openai.chat_completion.serving.OpenAIServingChat", "methods": [ { "kind": "function", "name": "OpenAIServingChat.__init__", "n_typed": 19, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 19, "n_params": 18, "n_function_overloads": 1, "n_function_params": 18 }, { "kind": "function", "name": "OpenAIServingChat.warmup", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "OpenAIServingChat.render_chat_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenAIServingChat.create_chat_completion", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OpenAIServingChat.get_chat_request_role", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenAIServingChat._bracket_level", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "OpenAIServingChat._filter_delta_text", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OpenAIServingChat.extract_tool_call_required_streaming", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "OpenAIServingChat.chat_completion_stream_generator", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "OpenAIServingChat.chat_completion_full_generator", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "OpenAIServingChat._get_top_logprobs", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "OpenAIServingChat._create_chat_logprobs", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "OpenAIServingChat._should_stream_with_auto_tool_parsing", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenAIServingChat._should_check_for_unstreamed_tool_arg_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OpenAIServingChat._create_remaining_args_delta", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "OpenAIServingChat._make_request_with_harmony", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OpenAIServingChat.response_role", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingChat.chat_template", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingChat.chat_template_content_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingChat.trust_request_chat_template", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingChat.default_chat_template_kwargs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingChat.enable_log_outputs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingChat.enable_log_deltas", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingChat.reasoning_parser_cls", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingChat.enable_auto_tools", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingChat.tool_parser", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingChat.exclude_tools_when_tool_choice_none", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingChat.enable_prompt_tokens_details", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingChat.enable_force_include_usage", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingChat.default_sampling_params", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingChat.override_max_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingChat.use_harmony", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingChat.supports_browsing", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingChat.browser_tool", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingChat.supports_code_interpreter", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingChat.python_tool", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingChat.tool_call_id_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 102, "n_typed": 79, "n_any": 0, "n_untyped": 23, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 16, "n_method_overloads": 16, "n_method_params": 65, "n_attrs": 21, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.openai.chat_completion.serving", "names": [ "vllm.entrypoints.openai.chat_completion.serving.OpenAIServingChat", "vllm.entrypoints.openai.chat_completion.serving.logger" ], "n_typable": 103, "n_typed": 79, "n_any": 0, "n_untyped": 24, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 16, "n_method_overloads": 16, "n_method_params": 65, "n_classes": 1, "n_attrs": 22, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/openai/chat_completion/stream_harmony.py", "symbol_reports": [ { "kind": "class", "name": "vllm.entrypoints.openai.chat_completion.stream_harmony.TokenState", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "TokenState.channel", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TokenState.recipient", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TokenState.text", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "function", "name": "vllm.entrypoints.openai.chat_completion.stream_harmony.extract_harmony_streaming_delta", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "type_ignores": [], "name": "vllm.entrypoints.openai.chat_completion.stream_harmony", "names": [ "vllm.entrypoints.openai.chat_completion.stream_harmony.TokenState", "vllm.entrypoints.openai.chat_completion.stream_harmony.extract_harmony_streaming_delta" ], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 4, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 1, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/openai/cli_args.py", "symbol_reports": [ { "kind": "function", "name": "vllm.entrypoints.openai.cli_args.create_parser_for_docs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.cli_args.BaseFrontendArgs", "methods": [ { "kind": "function", "name": "BaseFrontendArgs._customize_cli_kwargs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseFrontendArgs.add_cli_args", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BaseFrontendArgs.lora_modules", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BaseFrontendArgs.chat_template", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BaseFrontendArgs.chat_template_content_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BaseFrontendArgs.trust_request_chat_template", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BaseFrontendArgs.default_chat_template_kwargs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BaseFrontendArgs.response_role", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BaseFrontendArgs.return_tokens_as_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BaseFrontendArgs.disable_frontend_multiprocessing", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BaseFrontendArgs.enable_auto_tool_choice", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BaseFrontendArgs.exclude_tools_when_tool_choice_none", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BaseFrontendArgs.tool_call_parser", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BaseFrontendArgs.tool_parser_plugin", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BaseFrontendArgs.tool_server", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BaseFrontendArgs.log_config_file", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BaseFrontendArgs.max_log_len", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BaseFrontendArgs.enable_prompt_tokens_details", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BaseFrontendArgs.enable_server_load_tracking", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BaseFrontendArgs.enable_force_include_usage", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BaseFrontendArgs.enable_tokenizer_info_endpoint", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BaseFrontendArgs.enable_log_outputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BaseFrontendArgs.enable_log_deltas", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BaseFrontendArgs.log_error_stack", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BaseFrontendArgs.tokens_only", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 27, "n_typed": 27, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 23, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.cli_args.FrontendArgs", "methods": [ { "kind": "function", "name": "FrontendArgs._customize_cli_kwargs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FrontendArgs.host", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FrontendArgs.port", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FrontendArgs.uds", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FrontendArgs.uvicorn_log_level", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FrontendArgs.disable_uvicorn_access_log", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FrontendArgs.disable_access_log_for_endpoints", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FrontendArgs.allow_credentials", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FrontendArgs.allowed_origins", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FrontendArgs.allowed_methods", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FrontendArgs.allowed_headers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FrontendArgs.api_key", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FrontendArgs.ssl_keyfile", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FrontendArgs.ssl_certfile", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FrontendArgs.ssl_ca_certs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FrontendArgs.enable_ssl_refresh", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FrontendArgs.ssl_cert_reqs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FrontendArgs.ssl_ciphers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FrontendArgs.root_path", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FrontendArgs.middleware", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FrontendArgs.enable_request_id_headers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FrontendArgs.disable_fastapi_docs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FrontendArgs.h11_max_incomplete_event_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FrontendArgs.h11_max_header_count", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FrontendArgs.enable_offline_docs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FrontendArgs.use_gpu_for_pooling_score", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 27, "n_typed": 27, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 25, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.cli_args.LoRAParserAction", "methods": [ { "kind": "function", "name": "LoRAParserAction.__call__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [], "n_typable": 5, "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.entrypoints.openai.cli_args.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.cli_args.make_arg_parser", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.cli_args.validate_parsed_serve_args", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.openai.cli_args", "names": [ "vllm.entrypoints.openai.cli_args.BaseFrontendArgs", "vllm.entrypoints.openai.cli_args.FrontendArgs", "vllm.entrypoints.openai.cli_args.LoRAParserAction", "vllm.entrypoints.openai.cli_args.create_parser_for_docs", "vllm.entrypoints.openai.cli_args.logger", "vllm.entrypoints.openai.cli_args.make_arg_parser", "vllm.entrypoints.openai.cli_args.validate_parsed_serve_args" ], "n_typable": 65, "n_typed": 62, "n_any": 0, "n_untyped": 3, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 2, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 7, "n_classes": 3, "n_attrs": 49, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/openai/completion/api_router.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.openai.completion.api_router.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.completion.api_router.completion", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.completion.api_router.render_completion", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.entrypoints.openai.completion.api_router.attach_router", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.entrypoints.openai.completion.api_router.ENDPOINT_LOAD_METRICS_FORMAT_HEADER_LABEL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.entrypoints.openai.completion.api_router.create_completion", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.entrypoints.openai.completion.api_router.router", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.openai.completion.api_router", "names": [ "vllm.entrypoints.openai.completion.api_router.ENDPOINT_LOAD_METRICS_FORMAT_HEADER_LABEL", "vllm.entrypoints.openai.completion.api_router.attach_router", "vllm.entrypoints.openai.completion.api_router.completion", "vllm.entrypoints.openai.completion.api_router.create_completion", "vllm.entrypoints.openai.completion.api_router.logger", "vllm.entrypoints.openai.completion.api_router.render_completion", "vllm.entrypoints.openai.completion.api_router.router" ], "n_typable": 12, "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 6, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/openai/completion/protocol.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.openai.completion.protocol.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.entrypoints.openai.completion.protocol.CompletionLogProbs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "CompletionLogProbs.text_offset", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionLogProbs.token_logprobs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionLogProbs.tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionLogProbs.top_logprobs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.completion.protocol.CompletionResponseChoice", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "CompletionResponseChoice.index", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionResponseChoice.text", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionResponseChoice.logprobs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionResponseChoice.finish_reason", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionResponseChoice.stop_reason", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionResponseChoice.token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionResponseChoice.prompt_logprobs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionResponseChoice.prompt_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 8, "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.completion.protocol.CompletionResponseStreamChoice", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "CompletionResponseStreamChoice.index", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionResponseStreamChoice.text", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionResponseStreamChoice.logprobs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionResponseStreamChoice.finish_reason", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionResponseStreamChoice.stop_reason", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionResponseStreamChoice.prompt_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionResponseStreamChoice.token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.completion.protocol.CompletionResponse", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "CompletionResponse.id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionResponse.object", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionResponse.created", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionResponse.model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionResponse.choices", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionResponse.service_tier", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionResponse.system_fingerprint", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionResponse.usage", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionResponse.kv_transfer_params", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 9, "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.completion.protocol.CompletionRequest", "methods": [ { "kind": "function", "name": "CompletionRequest.build_tok_params", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompletionRequest.to_beam_search_params", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CompletionRequest.to_sampling_params", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CompletionRequest.validate_response_format", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompletionRequest.check_structured_outputs_count", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompletionRequest.check_logprobs", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompletionRequest.validate_stream_options", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompletionRequest.validate_prompt_and_prompt_embeds", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompletionRequest.check_cache_salt_support", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CompletionRequest.model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.prompt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.echo", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.frequency_penalty", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.logit_bias", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.logprobs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.max_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.n", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.presence_penalty", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.seed", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.stop", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.stream", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.stream_options", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.suffix", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.temperature", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.top_p", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.user", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.use_beam_search", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.top_k", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.min_p", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.repetition_penalty", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.length_penalty", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.stop_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.include_stop_str_in_output", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.ignore_eos", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.min_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.skip_special_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.spaces_between_special_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.truncate_prompt_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.allowed_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.prompt_logprobs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.prompt_embeds", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.add_special_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.response_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.structured_outputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.priority", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.request_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.return_tokens_as_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.return_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.cache_salt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.kv_transfer_params", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.vllm_xargs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest.repetition_detection", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequest._DEFAULT_SAMPLING_PARAMS", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 64, "n_typed": 52, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 11, "n_attrs": 44, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.completion.protocol.CompletionStreamResponse", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "CompletionStreamResponse.id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionStreamResponse.object", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionStreamResponse.created", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionStreamResponse.model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionStreamResponse.choices", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionStreamResponse.usage", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.openai.completion.protocol", "names": [ "vllm.entrypoints.openai.completion.protocol.CompletionLogProbs", "vllm.entrypoints.openai.completion.protocol.CompletionRequest", "vllm.entrypoints.openai.completion.protocol.CompletionResponse", "vllm.entrypoints.openai.completion.protocol.CompletionResponseChoice", "vllm.entrypoints.openai.completion.protocol.CompletionResponseStreamChoice", "vllm.entrypoints.openai.completion.protocol.CompletionStreamResponse", "vllm.entrypoints.openai.completion.protocol.logger" ], "n_typable": 99, "n_typed": 86, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 11, "n_classes": 6, "n_attrs": 79, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/openai/completion/serving.py", "symbol_reports": [ { "kind": "class", "name": "vllm.entrypoints.openai.completion.serving.OpenAIServingCompletion", "methods": [ { "kind": "function", "name": "OpenAIServingCompletion.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "OpenAIServingCompletion.render_completion_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenAIServingCompletion.create_completion", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OpenAIServingCompletion.completion_stream_generator", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "OpenAIServingCompletion.request_output_to_completion_response", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "OpenAIServingCompletion._create_completion_logprobs", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OpenAIServingCompletion.enable_prompt_tokens_details", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingCompletion.enable_force_include_usage", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingCompletion.default_sampling_params", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingCompletion.override_max_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 42, "n_typed": 37, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 32, "n_attrs": 4, "n_properties": 0 }, { "kind": "attr", "name": "vllm.entrypoints.openai.completion.serving.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.openai.completion.serving", "names": [ "vllm.entrypoints.openai.completion.serving.OpenAIServingCompletion", "vllm.entrypoints.openai.completion.serving.logger" ], "n_typable": 43, "n_typed": 37, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 32, "n_classes": 1, "n_attrs": 5, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/openai/engine/protocol.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.openai.engine.protocol.AnyResponseFormat", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.entrypoints.openai.engine.protocol.LogitsProcessorConstructor", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "LogitsProcessorConstructor.qualname", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LogitsProcessorConstructor.args", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LogitsProcessorConstructor.kwargs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LogitsProcessorConstructor.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 4, "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.engine.protocol.ModelList", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ModelList.object", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelList.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.engine.protocol.JsonSchemaResponseFormat", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "JsonSchemaResponseFormat.name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "JsonSchemaResponseFormat.description", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "JsonSchemaResponseFormat.json_schema", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "JsonSchemaResponseFormat.strict", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.engine.protocol.FunctionCall", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "FunctionCall.id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FunctionCall.name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FunctionCall.arguments", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.engine.protocol.ModelCard", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ModelCard.id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelCard.object", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelCard.created", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelCard.owned_by", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelCard.root", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelCard.parent", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelCard.max_model_len", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelCard.permission", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 8, "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.engine.protocol.ExtractedToolCallInformation", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ExtractedToolCallInformation.tools_called", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ExtractedToolCallInformation.tool_calls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ExtractedToolCallInformation.content", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "function", "name": "vllm.entrypoints.openai.engine.protocol.get_logits_processors", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.entrypoints.openai.engine.protocol.GenerateRequest", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "GenerateRequest.request_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateRequest.token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateRequest.features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateRequest.sampling_params", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateRequest.model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateRequest.stream", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateRequest.stream_options", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateRequest.cache_salt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateRequest.priority", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateRequest.kv_transfer_params", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 10, "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 10, "n_properties": 0 }, { "kind": "attr", "name": "vllm.entrypoints.openai.engine.protocol.LogitsProcessors", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.engine.protocol.StreamOptions", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "StreamOptions.include_usage", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "StreamOptions.continuous_usage_stats", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.engine.protocol.RequestResponseMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "RequestResponseMetadata.request_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "RequestResponseMetadata.final_usage_info", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.engine.protocol.LegacyStructuralTag", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "LegacyStructuralTag.begin", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LegacyStructuralTag.structural_tag_schema", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LegacyStructuralTag.end", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.engine.protocol.DeltaToolCall", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "DeltaToolCall.id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeltaToolCall.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeltaToolCall.index", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeltaToolCall.function", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.engine.protocol.LegacyStructuralTagResponseFormat", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "LegacyStructuralTagResponseFormat.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LegacyStructuralTagResponseFormat.structures", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LegacyStructuralTagResponseFormat.triggers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.entrypoints.openai.engine.protocol.AnyStructuralTagResponseFormat", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.entrypoints.openai.engine.protocol.StructuralTagResponseFormat", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "StructuralTagResponseFormat.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "StructuralTagResponseFormat.format", "n_typed": 0, "n_any": 1, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.engine.protocol.ErrorResponse", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ErrorResponse.error", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.engine.protocol.ToolCall", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ToolCall.id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ToolCall.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ToolCall.function", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.engine.protocol.PromptTokenUsageInfo", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "PromptTokenUsageInfo.cached_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.engine.protocol.ErrorInfo", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ErrorInfo.message", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ErrorInfo.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ErrorInfo.param", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ErrorInfo.code", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.engine.protocol.OpenAIBaseModel", "methods": [ { "kind": "function", "name": "OpenAIBaseModel.__log_extra_fields__", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OpenAIBaseModel.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIBaseModel.field_names", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 5, "n_typed": 1, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.engine.protocol.ModelPermission", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ModelPermission.id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelPermission.object", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelPermission.created", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelPermission.allow_create_engine", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelPermission.allow_sampling", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelPermission.allow_logprobs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelPermission.allow_search_indices", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelPermission.allow_view", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelPermission.allow_fine_tuning", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelPermission.organization", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelPermission.group", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelPermission.is_blocking", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 12, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.engine.protocol.DeltaFunctionCall", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "DeltaFunctionCall.name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeltaFunctionCall.arguments", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.engine.protocol.UsageInfo", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "UsageInfo.prompt_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "UsageInfo.total_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "UsageInfo.completion_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "UsageInfo.prompt_tokens_details", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.engine.protocol.ResponseFormat", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ResponseFormat.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponseFormat.json_schema", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.engine.protocol.FunctionDefinition", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "FunctionDefinition.name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FunctionDefinition.description", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FunctionDefinition.parameters", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.entrypoints.openai.engine.protocol.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.entrypoints.openai.engine.protocol.DeltaMessage", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "DeltaMessage.role", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeltaMessage.content", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeltaMessage.reasoning", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeltaMessage.tool_calls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.openai.engine.protocol", "names": [ "vllm.entrypoints.openai.engine.protocol.AnyResponseFormat", "vllm.entrypoints.openai.engine.protocol.AnyStructuralTagResponseFormat", "vllm.entrypoints.openai.engine.protocol.DeltaFunctionCall", "vllm.entrypoints.openai.engine.protocol.DeltaMessage", "vllm.entrypoints.openai.engine.protocol.DeltaToolCall", "vllm.entrypoints.openai.engine.protocol.ErrorInfo", "vllm.entrypoints.openai.engine.protocol.ErrorResponse", "vllm.entrypoints.openai.engine.protocol.ExtractedToolCallInformation", "vllm.entrypoints.openai.engine.protocol.FunctionCall", "vllm.entrypoints.openai.engine.protocol.FunctionDefinition", "vllm.entrypoints.openai.engine.protocol.GenerateRequest", "vllm.entrypoints.openai.engine.protocol.JsonSchemaResponseFormat", "vllm.entrypoints.openai.engine.protocol.LegacyStructuralTag", "vllm.entrypoints.openai.engine.protocol.LegacyStructuralTagResponseFormat", "vllm.entrypoints.openai.engine.protocol.LogitsProcessorConstructor", "vllm.entrypoints.openai.engine.protocol.LogitsProcessors", "vllm.entrypoints.openai.engine.protocol.ModelCard", "vllm.entrypoints.openai.engine.protocol.ModelList", "vllm.entrypoints.openai.engine.protocol.ModelPermission", "vllm.entrypoints.openai.engine.protocol.OpenAIBaseModel", "vllm.entrypoints.openai.engine.protocol.PromptTokenUsageInfo", "vllm.entrypoints.openai.engine.protocol.RequestResponseMetadata", "vllm.entrypoints.openai.engine.protocol.ResponseFormat", "vllm.entrypoints.openai.engine.protocol.StreamOptions", "vllm.entrypoints.openai.engine.protocol.StructuralTagResponseFormat", "vllm.entrypoints.openai.engine.protocol.ToolCall", "vllm.entrypoints.openai.engine.protocol.UsageInfo", "vllm.entrypoints.openai.engine.protocol.get_logits_processors", "vllm.entrypoints.openai.engine.protocol.logger" ], "n_typable": 97, "n_typed": 90, "n_any": 1, "n_untyped": 6, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_classes": 24, "n_attrs": 92, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/openai/engine/serving.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.openai.engine.serving.RequestT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.engine.serving.GenerationError", "methods": [ { "kind": "function", "name": "GenerationError.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GenerationError.status_code", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 3, "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.engine.serving.RendererRequest", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.entrypoints.openai.engine.serving.AnyRequest", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.entrypoints.openai.engine.serving.RendererChatRequest", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.engine.serving.ServeContext", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ServeContext.request", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ServeContext.raw_request", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ServeContext.model_name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ServeContext.request_id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ServeContext.created_time", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ServeContext.lora_request", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ServeContext.engine_prompts", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ServeContext.result_generator", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ServeContext.final_res_batch", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ServeContext.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 10, "n_properties": 0 }, { "kind": "attr", "name": "vllm.entrypoints.openai.engine.serving.CompletionLikeRequest", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.entrypoints.openai.engine.serving.AnyResponse", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.entrypoints.openai.engine.serving.OpenAIServing", "methods": [ { "kind": "function", "name": "OpenAIServing.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "OpenAIServing.beam_search", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "OpenAIServing._preprocess", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenAIServing._build_response", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenAIServing.handle", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenAIServing._pipeline", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenAIServing._validate_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenAIServing._create_pooling_params", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenAIServing._prepare_generators", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenAIServing._collect_batch", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenAIServing.create_error_response", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "OpenAIServing.create_streaming_error_response", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "OpenAIServing._raise_if_error", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OpenAIServing._convert_generation_error_to_response", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenAIServing._convert_generation_error_to_streaming_response", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenAIServing._check_model", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenAIServing._get_active_default_mm_loras", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenAIServing._maybe_get_adapters", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OpenAIServing._get_message_types", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenAIServing._validate_input", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "OpenAIServing._validate_chat_template", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "OpenAIServing._prepare_extra_chat_template_kwargs", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OpenAIServing._preprocess_completion", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "OpenAIServing._preprocess_cmpl", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OpenAIServing._preprocess_chat", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "OpenAIServing._extract_prompt_components", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenAIServing._extract_prompt_text", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenAIServing._extract_prompt_len", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenAIServing._render_next_turn", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "OpenAIServing._generate_with_builtin_tools", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "OpenAIServing._log_inputs", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "OpenAIServing._get_trace_headers", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenAIServing._base_request_id", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OpenAIServing._get_data_parallel_rank", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenAIServing._parse_tool_calls_from_content", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "OpenAIServing._get_decoded_token", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "OpenAIServing._is_model_supported", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OpenAIServing.request_id_prefix", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServing.engine_client", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServing.models", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServing.request_logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServing.return_tokens_as_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServing.log_error_stack", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServing.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServing.renderer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServing.io_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServing.input_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 136, "n_typed": 121, "n_any": 0, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 37, "n_method_overloads": 37, "n_method_params": 89, "n_attrs": 10, "n_properties": 0 }, { "kind": "function", "name": "vllm.entrypoints.openai.engine.serving.clamp_prompt_logprobs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.entrypoints.openai.engine.serving.SpeechToTextRequest", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.entrypoints.openai.engine.serving.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.entrypoints.openai.engine.serving.ChatLikeRequest", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.openai.engine.serving", "names": [ "vllm.entrypoints.openai.engine.serving.AnyRequest", "vllm.entrypoints.openai.engine.serving.AnyResponse", "vllm.entrypoints.openai.engine.serving.ChatLikeRequest", "vllm.entrypoints.openai.engine.serving.CompletionLikeRequest", "vllm.entrypoints.openai.engine.serving.GenerationError", "vllm.entrypoints.openai.engine.serving.OpenAIServing", "vllm.entrypoints.openai.engine.serving.RendererChatRequest", "vllm.entrypoints.openai.engine.serving.RendererRequest", "vllm.entrypoints.openai.engine.serving.RequestT", "vllm.entrypoints.openai.engine.serving.ServeContext", "vllm.entrypoints.openai.engine.serving.SpeechToTextRequest", "vllm.entrypoints.openai.engine.serving.clamp_prompt_logprobs", "vllm.entrypoints.openai.engine.serving.logger" ], "n_typable": 148, "n_typed": 129, "n_any": 0, "n_untyped": 19, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 38, "n_method_overloads": 38, "n_method_params": 90, "n_classes": 5, "n_attrs": 28, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/openai/generate/api_router.py", "symbol_reports": [ { "kind": "function", "name": "vllm.entrypoints.openai.generate.api_router.register_generate_api_routers", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.entrypoints.openai.generate.api_router.RequestLogger", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.entrypoints.openai.generate.api_router.init_generate_state", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "type_ignores": [], "name": "vllm.entrypoints.openai.generate.api_router", "names": [ "vllm.entrypoints.openai.generate.api_router.RequestLogger", "vllm.entrypoints.openai.generate.api_router.init_generate_state", "vllm.entrypoints.openai.generate.api_router.register_generate_api_routers" ], "n_typable": 8, "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 6, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/openai/models/api_router.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.openai.models.api_router.router", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.models.api_router.models", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.models.api_router.attach_router", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.models.api_router.show_available_models", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.entrypoints.openai.models.api_router.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.openai.models.api_router", "names": [ "vllm.entrypoints.openai.models.api_router.attach_router", "vllm.entrypoints.openai.models.api_router.logger", "vllm.entrypoints.openai.models.api_router.models", "vllm.entrypoints.openai.models.api_router.router", "vllm.entrypoints.openai.models.api_router.show_available_models" ], "n_typable": 8, "n_typed": 4, "n_any": 0, "n_untyped": 4, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 3, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/openai/models/protocol.py", "symbol_reports": [ { "kind": "class", "name": "vllm.entrypoints.openai.models.protocol.BaseModelPath", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "BaseModelPath.name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BaseModelPath.model_path", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.models.protocol.LoRAModulePath", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "LoRAModulePath.name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LoRAModulePath.path", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LoRAModulePath.base_model_name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.openai.models.protocol", "names": [ "vllm.entrypoints.openai.models.protocol.BaseModelPath", "vllm.entrypoints.openai.models.protocol.LoRAModulePath" ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 2, "n_attrs": 5, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/openai/models/serving.py", "symbol_reports": [ { "kind": "function", "name": "vllm.entrypoints.openai.models.serving.create_error_response", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.entrypoints.openai.models.serving.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.entrypoints.openai.models.serving.OpenAIServingModels", "methods": [ { "kind": "function", "name": "OpenAIServingModels.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "OpenAIServingModels.init_static_loras", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "OpenAIServingModels.is_base_model", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenAIServingModels.model_name", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenAIServingModels.show_available_models", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "OpenAIServingModels.load_lora_adapter", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OpenAIServingModels.unload_lora_adapter", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenAIServingModels._check_load_lora_adapter_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenAIServingModels._check_unload_lora_adapter_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenAIServingModels.resolve_lora", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OpenAIServingModels.engine_client", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingModels.base_model_paths", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingModels.static_lora_modules", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingModels.lora_requests", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingModels.lora_id_counter", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingModels.lora_resolvers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingModels.lora_resolver_lock", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingModels.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingModels.renderer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingModels.io_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingModels.input_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 32, "n_typed": 21, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 11, "n_attrs": 11, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.openai.models.serving", "names": [ "vllm.entrypoints.openai.models.serving.OpenAIServingModels", "vllm.entrypoints.openai.models.serving.create_error_response", "vllm.entrypoints.openai.models.serving.logger" ], "n_typable": 37, "n_typed": 25, "n_any": 0, "n_untyped": 12, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 3, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 11, "n_classes": 1, "n_attrs": 12, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/openai/orca_metrics.py", "symbol_reports": [ { "kind": "function", "name": "vllm.entrypoints.openai.orca_metrics.metrics_header", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.entrypoints.openai.orca_metrics.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.orca_metrics.create_orca_header", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.entrypoints.openai.orca_metrics.get_named_metrics_from_prometheus", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.openai.orca_metrics", "names": [ "vllm.entrypoints.openai.orca_metrics.create_orca_header", "vllm.entrypoints.openai.orca_metrics.get_named_metrics_from_prometheus", "vllm.entrypoints.openai.orca_metrics.logger", "vllm.entrypoints.openai.orca_metrics.metrics_header" ], "n_typable": 7, "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 3, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/openai/parser/harmony_utils.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.openai.parser.harmony_utils.MCP_BUILTIN_TOOLS", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.parser.harmony_utils.get_user_message", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.parser.harmony_utils.get_developer_message", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.entrypoints.openai.parser.harmony_utils.get_streamable_parser_for_assistant", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.entrypoints.openai.parser.harmony_utils.flatten_chat_text_content", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.parser.harmony_utils.render_for_completion", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.parser.harmony_utils.has_custom_tools", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.parser.harmony_utils.get_encoding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.entrypoints.openai.parser.harmony_utils.auto_drop_analysis_messages", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.entrypoints.openai.parser.harmony_utils.REASONING_EFFORT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.entrypoints.openai.parser.harmony_utils.parse_chat_inputs_to_harmony_messages", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.parser.harmony_utils.get_stop_tokens_for_assistant_actions", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.entrypoints.openai.parser.harmony_utils.parse_output_into_messages", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.parser.harmony_utils.create_tool_definition", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.parser.harmony_utils.parse_chat_input_to_harmony_message", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.entrypoints.openai.parser.harmony_utils.BUILTIN_TOOL_TO_MCP_SERVER_LABEL", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.parser.harmony_utils.parse_chat_output", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.parser.harmony_utils.get_system_message", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "attr", "name": "vllm.entrypoints.openai.parser.harmony_utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.openai.parser.harmony_utils", "names": [ "vllm.entrypoints.openai.parser.harmony_utils.BUILTIN_TOOL_TO_MCP_SERVER_LABEL", "vllm.entrypoints.openai.parser.harmony_utils.MCP_BUILTIN_TOOLS", "vllm.entrypoints.openai.parser.harmony_utils.REASONING_EFFORT", "vllm.entrypoints.openai.parser.harmony_utils.auto_drop_analysis_messages", "vllm.entrypoints.openai.parser.harmony_utils.create_tool_definition", "vllm.entrypoints.openai.parser.harmony_utils.flatten_chat_text_content", "vllm.entrypoints.openai.parser.harmony_utils.get_developer_message", "vllm.entrypoints.openai.parser.harmony_utils.get_encoding", "vllm.entrypoints.openai.parser.harmony_utils.get_stop_tokens_for_assistant_actions", "vllm.entrypoints.openai.parser.harmony_utils.get_streamable_parser_for_assistant", "vllm.entrypoints.openai.parser.harmony_utils.get_system_message", "vllm.entrypoints.openai.parser.harmony_utils.get_user_message", "vllm.entrypoints.openai.parser.harmony_utils.has_custom_tools", "vllm.entrypoints.openai.parser.harmony_utils.logger", "vllm.entrypoints.openai.parser.harmony_utils.parse_chat_input_to_harmony_message", "vllm.entrypoints.openai.parser.harmony_utils.parse_chat_inputs_to_harmony_messages", "vllm.entrypoints.openai.parser.harmony_utils.parse_chat_output", "vllm.entrypoints.openai.parser.harmony_utils.parse_output_into_messages", "vllm.entrypoints.openai.parser.harmony_utils.render_for_completion" ], "n_typable": 39, "n_typed": 35, "n_any": 0, "n_untyped": 4, "n_functions": 15, "n_function_overloads": 15, "n_function_params": 21, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/openai/parser/responses_parser.py", "symbol_reports": [ { "kind": "class", "name": "vllm.entrypoints.openai.parser.responses_parser.ResponsesParser", "methods": [ { "kind": "function", "name": "ResponsesParser.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "ResponsesParser.process", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ResponsesParser.make_response_output_items_from_parsable_context", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ResponsesParser.response_messages", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesParser.num_init_messages", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesParser.tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesParser.request", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesParser.reasoning_parser_instance", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesParser.tool_parser_instance", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesParser.finish_reason", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 16, "n_typed": 10, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_attrs": 7, "n_properties": 0 }, { "kind": "attr", "name": "vllm.entrypoints.openai.parser.responses_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.parser.responses_parser.get_responses_parser_for_simple_context", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "type_ignores": [], "name": "vllm.entrypoints.openai.parser.responses_parser", "names": [ "vllm.entrypoints.openai.parser.responses_parser.ResponsesParser", "vllm.entrypoints.openai.parser.responses_parser.get_responses_parser_for_simple_context", "vllm.entrypoints.openai.parser.responses_parser.logger" ], "n_typable": 23, "n_typed": 15, "n_any": 0, "n_untyped": 8, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 5, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_classes": 1, "n_attrs": 8, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/openai/realtime/api_router.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.openai.realtime.api_router.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.realtime.api_router.realtime_endpoint", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.entrypoints.openai.realtime.api_router.RequestLogger", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.entrypoints.openai.realtime.api_router.attach_router", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.realtime.api_router.init_realtime_state", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "attr", "name": "vllm.entrypoints.openai.realtime.api_router.router", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.openai.realtime.api_router", "names": [ "vllm.entrypoints.openai.realtime.api_router.RequestLogger", "vllm.entrypoints.openai.realtime.api_router.attach_router", "vllm.entrypoints.openai.realtime.api_router.init_realtime_state", "vllm.entrypoints.openai.realtime.api_router.logger", "vllm.entrypoints.openai.realtime.api_router.realtime_endpoint", "vllm.entrypoints.openai.realtime.api_router.router" ], "n_typable": 12, "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 7, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/openai/realtime/connection.py", "symbol_reports": [ { "kind": "class", "name": "vllm.entrypoints.openai.realtime.connection.RealtimeConnection", "methods": [ { "kind": "function", "name": "RealtimeConnection.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "RealtimeConnection.handle_connection", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RealtimeConnection._check_model", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RealtimeConnection.handle_event", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RealtimeConnection.audio_stream_generator", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RealtimeConnection.start_generation", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RealtimeConnection._run_generation", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "RealtimeConnection.send", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RealtimeConnection.send_error", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "RealtimeConnection.cleanup", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RealtimeConnection.websocket", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RealtimeConnection.connection_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RealtimeConnection.serving", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RealtimeConnection.audio_queue", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "RealtimeConnection.generation_task", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 24, "n_typed": 13, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 9, "n_attrs": 5, "n_properties": 0 }, { "kind": "attr", "name": "vllm.entrypoints.openai.realtime.connection.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.openai.realtime.connection", "names": [ "vllm.entrypoints.openai.realtime.connection.RealtimeConnection", "vllm.entrypoints.openai.realtime.connection.logger" ], "n_typable": 25, "n_typed": 13, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 9, "n_classes": 1, "n_attrs": 6, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/openai/realtime/protocol.py", "symbol_reports": [ { "kind": "class", "name": "vllm.entrypoints.openai.realtime.protocol.InputAudioBufferAppend", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "InputAudioBufferAppend.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputAudioBufferAppend.audio", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.realtime.protocol.SessionUpdate", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "SessionUpdate.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SessionUpdate.model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.realtime.protocol.TranscriptionDelta", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "TranscriptionDelta.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionDelta.delta", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.realtime.protocol.ErrorEvent", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ErrorEvent.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ErrorEvent.error", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ErrorEvent.code", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.realtime.protocol.TranscriptionDone", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "TranscriptionDone.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionDone.text", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionDone.usage", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.realtime.protocol.InputAudioBufferCommit", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "InputAudioBufferCommit.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputAudioBufferCommit.final", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.realtime.protocol.SessionCreated", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "SessionCreated.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SessionCreated.id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SessionCreated.created", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.openai.realtime.protocol", "names": [ "vllm.entrypoints.openai.realtime.protocol.ErrorEvent", "vllm.entrypoints.openai.realtime.protocol.InputAudioBufferAppend", "vllm.entrypoints.openai.realtime.protocol.InputAudioBufferCommit", "vllm.entrypoints.openai.realtime.protocol.SessionCreated", "vllm.entrypoints.openai.realtime.protocol.SessionUpdate", "vllm.entrypoints.openai.realtime.protocol.TranscriptionDelta", "vllm.entrypoints.openai.realtime.protocol.TranscriptionDone" ], "n_typable": 17, "n_typed": 17, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 7, "n_attrs": 17, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/openai/realtime/serving.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.openai.realtime.serving.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.entrypoints.openai.realtime.serving.OpenAIServingRealtime", "methods": [ { "kind": "function", "name": "OpenAIServingRealtime.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "OpenAIServingRealtime.transcribe_realtime", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [ { "kind": "property", "name": "OpenAIServingRealtime.model_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "OpenAIServingRealtime.task_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 10, "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 1, "n_properties": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.openai.realtime.serving", "names": [ "vllm.entrypoints.openai.realtime.serving.OpenAIServingRealtime", "vllm.entrypoints.openai.realtime.serving.logger" ], "n_typable": 11, "n_typed": 9, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_classes": 1, "n_attrs": 2, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/openai/responses/api_router.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.openai.responses.api_router.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.responses.api_router.responses", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.responses.api_router.attach_router", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.responses.api_router.retrieve_responses", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.entrypoints.openai.responses.api_router.cancel_responses", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.entrypoints.openai.responses.api_router.router", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.responses.api_router.create_responses", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.entrypoints.openai.responses.api_router", "names": [ "vllm.entrypoints.openai.responses.api_router.attach_router", "vllm.entrypoints.openai.responses.api_router.cancel_responses", "vllm.entrypoints.openai.responses.api_router.create_responses", "vllm.entrypoints.openai.responses.api_router.logger", "vllm.entrypoints.openai.responses.api_router.responses", "vllm.entrypoints.openai.responses.api_router.retrieve_responses", "vllm.entrypoints.openai.responses.api_router.router" ], "n_typable": 17, "n_typed": 11, "n_any": 0, "n_untyped": 6, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 10, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/openai/responses/context.py", "symbol_reports": [ { "kind": "class", "name": "vllm.entrypoints.openai.responses.context.StreamingHarmonyContext", "methods": [ { "kind": "function", "name": "StreamingHarmonyContext.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StreamingHarmonyContext.append_output", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StreamingHarmonyContext.append_tool_output", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StreamingHarmonyContext.is_expecting_start", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "StreamingHarmonyContext.is_assistant_action_turn", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "StreamingHarmonyContext.render_for_completion", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "StreamingHarmonyContext.messages", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "StreamingHarmonyContext.last_output", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StreamingHarmonyContext.parser", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StreamingHarmonyContext.encoding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StreamingHarmonyContext.last_tok", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StreamingHarmonyContext.first_tok_of_message", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StreamingHarmonyContext.last_content_delta", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 8, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 4, "n_attrs": 6, "n_properties": 1 }, { "kind": "class", "name": "vllm.entrypoints.openai.responses.context.ParsableContext", "methods": [ { "kind": "function", "name": "ParsableContext.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "ParsableContext.append_output", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ParsableContext.append_tool_output", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ParsableContext.need_builtin_tool_call", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ParsableContext.call_python_tool", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ParsableContext.call_search_tool", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ParsableContext.call_container_tool", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ParsableContext.call_tool", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ParsableContext.render_for_completion", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ParsableContext.init_tool_sessions", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ParsableContext.cleanup_session", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ParsableContext.num_prompt_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ParsableContext.num_output_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ParsableContext.num_cached_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ParsableContext.num_reasoning_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ParsableContext.all_turn_metrics", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParsableContext.parser", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ParsableContext.tool_parser_cls", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ParsableContext.request", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ParsableContext.available_tools", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ParsableContext.called_tools", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParsableContext.tool_dicts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ParsableContext.chat_template", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ParsableContext.chat_template_content_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParsableContext.input_messages", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParsableContext.output_messages", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 48, "n_typed": 33, "n_any": 0, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 22, "n_attrs": 15, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.responses.context.SimpleContext", "methods": [ { "kind": "function", "name": "SimpleContext.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SimpleContext.append_output", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SimpleContext.append_tool_output", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SimpleContext.need_builtin_tool_call", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SimpleContext.call_tool", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SimpleContext.render_for_completion", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SimpleContext.init_tool_sessions", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "SimpleContext.cleanup_session", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "SimpleContext.output_messages", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "SimpleContext.final_output", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "SimpleContext.last_output", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SimpleContext.num_prompt_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SimpleContext.num_output_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SimpleContext.num_cached_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SimpleContext.num_reasoning_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SimpleContext.all_turn_metrics", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SimpleContext.input_messages", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 23, "n_typed": 14, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 6, "n_attrs": 7, "n_properties": 2 }, { "kind": "class", "name": "vllm.entrypoints.openai.responses.context.ConversationContext", "methods": [ { "kind": "function", "name": "ConversationContext.append_output", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ConversationContext.append_tool_output", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ConversationContext.call_tool", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ConversationContext.need_builtin_tool_call", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ConversationContext.render_for_completion", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ConversationContext.init_tool_sessions", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ConversationContext.cleanup_session", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 13, "n_typed": 12, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 6, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.responses.context.HarmonyContext", "methods": [ { "kind": "function", "name": "HarmonyContext.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "HarmonyContext._update_num_reasoning_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "HarmonyContext.append_output", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HarmonyContext.append_tool_output", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HarmonyContext._update_prefill_token_usage", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HarmonyContext._update_decode_token_usage", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HarmonyContext.need_builtin_tool_call", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "HarmonyContext.call_tool", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "HarmonyContext.render_for_completion", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "HarmonyContext.call_search_tool", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "HarmonyContext.call_python_tool", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "HarmonyContext.init_tool_sessions", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "HarmonyContext.call_container_tool", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "HarmonyContext.cleanup_session", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [ { "kind": "property", "name": "HarmonyContext.messages", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "HarmonyContext.finish_reason", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "HarmonyContext.available_tools", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HarmonyContext.called_tools", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "HarmonyContext.parser", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HarmonyContext.num_init_messages", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HarmonyContext.num_prompt_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HarmonyContext.num_output_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HarmonyContext.num_cached_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HarmonyContext.num_reasoning_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HarmonyContext.num_tool_output_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HarmonyContext.current_turn_metrics", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HarmonyContext.all_turn_metrics", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "HarmonyContext.is_first_turn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HarmonyContext.first_tok_of_message", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 47, "n_typed": 31, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 18, "n_attrs": 14, "n_properties": 1 }, { "kind": "class", "name": "vllm.entrypoints.openai.responses.context.TurnMetrics", "methods": [ { "kind": "function", "name": "TurnMetrics.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "TurnMetrics.reset", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TurnMetrics.copy", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TurnMetrics.input_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TurnMetrics.output_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TurnMetrics.cached_input_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TurnMetrics.tool_output_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 7, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_attrs": 4, "n_properties": 0 }, { "kind": "attr", "name": "vllm.entrypoints.openai.responses.context.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.openai.responses.context", "names": [ "vllm.entrypoints.openai.responses.context.ConversationContext", "vllm.entrypoints.openai.responses.context.HarmonyContext", "vllm.entrypoints.openai.responses.context.ParsableContext", "vllm.entrypoints.openai.responses.context.SimpleContext", "vllm.entrypoints.openai.responses.context.StreamingHarmonyContext", "vllm.entrypoints.openai.responses.context.TurnMetrics", "vllm.entrypoints.openai.responses.context.logger" ], "n_typable": 160, "n_typed": 105, "n_any": 0, "n_untyped": 55, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 49, "n_method_overloads": 49, "n_method_params": 60, "n_classes": 6, "n_attrs": 47, "n_properties": 4, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/openai/responses/harmony.py", "symbol_reports": [ { "kind": "function", "name": "vllm.entrypoints.openai.responses.harmony.response_previous_input_to_harmony", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.responses.harmony.response_input_to_harmony", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.entrypoints.openai.responses.harmony.construct_harmony_previous_input_messages", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.responses.harmony.parser_state_to_response_output", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.entrypoints.openai.responses.harmony.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.responses.harmony.harmony_to_response_output", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.openai.responses.harmony", "names": [ "vllm.entrypoints.openai.responses.harmony.construct_harmony_previous_input_messages", "vllm.entrypoints.openai.responses.harmony.harmony_to_response_output", "vllm.entrypoints.openai.responses.harmony.logger", "vllm.entrypoints.openai.responses.harmony.parser_state_to_response_output", "vllm.entrypoints.openai.responses.harmony.response_input_to_harmony", "vllm.entrypoints.openai.responses.harmony.response_previous_input_to_harmony" ], "n_typable": 12, "n_typed": 10, "n_any": 0, "n_untyped": 2, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 6, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/openai/responses/protocol.py", "symbol_reports": [ { "kind": "class", "name": "vllm.entrypoints.openai.responses.protocol.OutputTokensDetails", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "OutputTokensDetails.reasoning_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "OutputTokensDetails.tool_output_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "OutputTokensDetails.output_tokens_per_turn", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "OutputTokensDetails.tool_output_tokens_per_turn", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "attr", "name": "vllm.entrypoints.openai.responses.protocol.StreamingResponsesResponse", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.entrypoints.openai.responses.protocol.ResponseReasoningPartAddedEvent", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ResponseReasoningPartAddedEvent.content_index", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponseReasoningPartAddedEvent.item_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponseReasoningPartAddedEvent.output_index", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponseReasoningPartAddedEvent.part", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponseReasoningPartAddedEvent.sequence_number", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponseReasoningPartAddedEvent.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.responses.protocol.ResponseUsage", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ResponseUsage.input_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponseUsage.input_tokens_details", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponseUsage.output_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponseUsage.output_tokens_details", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponseUsage.total_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.responses.protocol.ResponseCreatedEvent", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ResponseCreatedEvent.response", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.entrypoints.openai.responses.protocol.serialize_messages", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.entrypoints.openai.responses.protocol.InputTokensDetails", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "InputTokensDetails.cached_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputTokensDetails.input_tokens_per_turn", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputTokensDetails.cached_tokens_per_turn", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.responses.protocol.ResponseRawMessageAndToken", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ResponseRawMessageAndToken.message", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponseRawMessageAndToken.tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponseRawMessageAndToken.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.responses.protocol.ResponsesResponse", "methods": [ { "kind": "function", "name": "ResponsesResponse.serialize_output_messages", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ResponsesResponse.serialize_input_messages", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ResponsesResponse.from_request", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ResponsesResponse.id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesResponse.created_at", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesResponse.incomplete_details", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesResponse.instructions", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesResponse.metadata", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesResponse.model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesResponse.object", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesResponse.output", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesResponse.parallel_tool_calls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesResponse.temperature", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesResponse.tool_choice", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesResponse.tools", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesResponse.top_p", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesResponse.background", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesResponse.max_output_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesResponse.max_tool_calls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesResponse.previous_response_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesResponse.prompt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesResponse.reasoning", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesResponse.service_tier", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesResponse.status", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesResponse.text", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesResponse.top_logprobs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesResponse.truncation", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesResponse.usage", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesResponse.user", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesResponse.input_messages", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesResponse.output_messages", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 44, "n_typed": 38, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 13, "n_attrs": 28, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.responses.protocol.ResponseCompletedEvent", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ResponseCompletedEvent.response", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.entrypoints.openai.responses.protocol.ResponseInputOutputItem", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.entrypoints.openai.responses.protocol.ResponseInProgressEvent", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ResponseInProgressEvent.response", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.entrypoints.openai.responses.protocol.ResponseInputOutputMessage", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.entrypoints.openai.responses.protocol.ResponsesRequest", "methods": [ { "kind": "function", "name": "ResponsesRequest.build_chat_params", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ResponsesRequest.build_tok_params", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ResponsesRequest.to_sampling_params", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ResponsesRequest.is_include_output_logprobs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ResponsesRequest.validate_background", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ResponsesRequest.validate_prompt", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ResponsesRequest.check_cache_salt_support", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ResponsesRequest.function_call_parsing", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ResponsesRequest.background", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesRequest.include", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesRequest.input", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesRequest.instructions", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesRequest.max_output_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesRequest.max_tool_calls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesRequest.metadata", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesRequest.model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesRequest.logit_bias", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesRequest.parallel_tool_calls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesRequest.previous_response_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesRequest.prompt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesRequest.reasoning", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesRequest.service_tier", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesRequest.store", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesRequest.stream", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesRequest.temperature", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesRequest.text", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesRequest.tool_choice", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesRequest.tools", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesRequest.top_logprobs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesRequest.top_p", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesRequest.top_k", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesRequest.truncation", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesRequest.user", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesRequest.skip_special_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesRequest.include_stop_str_in_output", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesRequest.prompt_cache_key", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesRequest.request_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesRequest.mm_processor_kwargs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesRequest.priority", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesRequest.cache_salt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesRequest.enable_response_messages", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesRequest.previous_input_messages", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesRequest.structured_outputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesRequest.repetition_penalty", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesRequest.seed", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesRequest.stop", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesRequest.ignore_eos", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesRequest.vllm_xargs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponsesRequest._DEFAULT_SAMPLING_PARAMS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 57, "n_typed": 49, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 9, "n_attrs": 41, "n_properties": 0 }, { "kind": "function", "name": "vllm.entrypoints.openai.responses.protocol.serialize_message", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.entrypoints.openai.responses.protocol.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.entrypoints.openai.responses.protocol.ResponseReasoningPartDoneEvent", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ResponseReasoningPartDoneEvent.content_index", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponseReasoningPartDoneEvent.item_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponseReasoningPartDoneEvent.output_index", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponseReasoningPartDoneEvent.part", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponseReasoningPartDoneEvent.sequence_number", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ResponseReasoningPartDoneEvent.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [ { "kind": "type", "rules": [ "override" ] }, { "kind": "type", "rules": [ "override" ] }, { "kind": "type", "rules": [ "override" ] } ], "name": "vllm.entrypoints.openai.responses.protocol", "names": [ "vllm.entrypoints.openai.responses.protocol.InputTokensDetails", "vllm.entrypoints.openai.responses.protocol.OutputTokensDetails", "vllm.entrypoints.openai.responses.protocol.ResponseCompletedEvent", "vllm.entrypoints.openai.responses.protocol.ResponseCreatedEvent", "vllm.entrypoints.openai.responses.protocol.ResponseInProgressEvent", "vllm.entrypoints.openai.responses.protocol.ResponseInputOutputItem", "vllm.entrypoints.openai.responses.protocol.ResponseInputOutputMessage", "vllm.entrypoints.openai.responses.protocol.ResponseRawMessageAndToken", "vllm.entrypoints.openai.responses.protocol.ResponseReasoningPartAddedEvent", "vllm.entrypoints.openai.responses.protocol.ResponseReasoningPartDoneEvent", "vllm.entrypoints.openai.responses.protocol.ResponseUsage", "vllm.entrypoints.openai.responses.protocol.ResponsesRequest", "vllm.entrypoints.openai.responses.protocol.ResponsesResponse", "vllm.entrypoints.openai.responses.protocol.StreamingResponsesResponse", "vllm.entrypoints.openai.responses.protocol.logger", "vllm.entrypoints.openai.responses.protocol.serialize_message", "vllm.entrypoints.openai.responses.protocol.serialize_messages" ], "n_typable": 139, "n_typed": 120, "n_any": 0, "n_untyped": 19, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 2, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 22, "n_classes": 11, "n_attrs": 103, "n_properties": 0, "n_type_ignores": 3 }, { "path": "vllm/entrypoints/openai/responses/serving.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.openai.responses.serving.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.entrypoints.openai.responses.serving.OpenAIServingResponses", "methods": [ { "kind": "function", "name": "OpenAIServingResponses.__init__", "n_typed": 15, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 15, "n_params": 14, "n_function_overloads": 1, "n_function_params": 14 }, { "kind": "function", "name": "OpenAIServingResponses._validate_generator_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenAIServingResponses._validate_create_responses_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenAIServingResponses.create_responses", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OpenAIServingResponses._make_request", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OpenAIServingResponses._make_request_with_harmony", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OpenAIServingResponses._initialize_tool_sessions", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "OpenAIServingResponses.responses_full_generator", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "OpenAIServingResponses._topk_logprobs", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "OpenAIServingResponses._create_response_logprobs", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "OpenAIServingResponses._create_stream_response_logprobs", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "OpenAIServingResponses._make_response_output_items", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "OpenAIServingResponses._make_response_output_items_with_harmony", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenAIServingResponses._extract_system_message_from_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenAIServingResponses._construct_harmony_system_input_message", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "OpenAIServingResponses._construct_input_messages_with_harmony", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OpenAIServingResponses._run_background_request_stream", "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "OpenAIServingResponses._run_background_request", "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "OpenAIServingResponses.responses_background_stream_generator", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OpenAIServingResponses.retrieve_responses", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "OpenAIServingResponses.cancel_responses", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenAIServingResponses._make_not_found_error", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenAIServingResponses._make_store_not_supported_error", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "OpenAIServingResponses._process_simple_streaming_events", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "OpenAIServingResponses._process_harmony_streaming_events", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "OpenAIServingResponses.responses_stream_generator", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OpenAIServingResponses.chat_template", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingResponses.chat_template_content_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingResponses.enable_log_outputs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingResponses.parser", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingResponses.enable_prompt_tokens_details", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingResponses.enable_force_include_usage", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingResponses.default_sampling_params", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingResponses.override_max_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingResponses.enable_store", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingResponses.use_harmony", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingResponses.enable_auto_tools", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingResponses.response_store", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingResponses.response_store_lock", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingResponses.msg_store", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingResponses.event_store", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingResponses.background_tasks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingResponses.tool_server", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingResponses.tool_call_id_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 137, "n_typed": 115, "n_any": 0, "n_untyped": 22, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 26, "n_method_overloads": 26, "n_method_params": 93, "n_attrs": 18, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.openai.responses.serving", "names": [ "vllm.entrypoints.openai.responses.serving.OpenAIServingResponses", "vllm.entrypoints.openai.responses.serving.logger" ], "n_typable": 138, "n_typed": 115, "n_any": 0, "n_untyped": 23, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 26, "n_method_overloads": 26, "n_method_params": 93, "n_classes": 1, "n_attrs": 19, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/openai/responses/streaming_events.py", "symbol_reports": [ { "kind": "function", "name": "vllm.entrypoints.openai.responses.streaming_events.emit_tool_action_events", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.entrypoints.openai.responses.streaming_events.emit_browser_tool_events", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.entrypoints.openai.responses.streaming_events.emit_mcp_completion_events", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.entrypoints.openai.responses.streaming_events.emit_text_output_done_events", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.entrypoints.openai.responses.streaming_events.is_mcp_tool_by_namespace", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.entrypoints.openai.responses.streaming_events.StreamingState", "methods": [ { "kind": "function", "name": "StreamingState.reset_for_new_item", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "StreamingState.current_content_index", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StreamingState.current_output_index", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StreamingState.current_item_id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StreamingState.current_call_id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StreamingState.sent_output_item_added", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StreamingState.is_first_function_call_delta", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 6, "n_properties": 0 }, { "kind": "function", "name": "vllm.entrypoints.openai.responses.streaming_events.emit_text_delta_events", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.entrypoints.openai.responses.streaming_events.emit_reasoning_done_events", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.entrypoints.openai.responses.streaming_events.emit_function_call_done_events", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.entrypoints.openai.responses.streaming_events.emit_mcp_delta_events", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.entrypoints.openai.responses.streaming_events.emit_content_delta_events", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.entrypoints.openai.responses.streaming_events.emit_code_interpreter_completion_events", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.entrypoints.openai.responses.streaming_events.emit_code_interpreter_delta_events", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.entrypoints.openai.responses.streaming_events.emit_previous_item_done_events", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.entrypoints.openai.responses.streaming_events.emit_reasoning_delta_events", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.entrypoints.openai.responses.streaming_events.emit_function_call_delta_events", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.entrypoints.openai.responses.streaming_events.TOOL_NAME_TO_MCP_SERVER_LABEL", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.openai.responses.streaming_events", "names": [ "vllm.entrypoints.openai.responses.streaming_events.StreamingState", "vllm.entrypoints.openai.responses.streaming_events.TOOL_NAME_TO_MCP_SERVER_LABEL", "vllm.entrypoints.openai.responses.streaming_events.emit_browser_tool_events", "vllm.entrypoints.openai.responses.streaming_events.emit_code_interpreter_completion_events", "vllm.entrypoints.openai.responses.streaming_events.emit_code_interpreter_delta_events", "vllm.entrypoints.openai.responses.streaming_events.emit_content_delta_events", "vllm.entrypoints.openai.responses.streaming_events.emit_function_call_delta_events", "vllm.entrypoints.openai.responses.streaming_events.emit_function_call_done_events", "vllm.entrypoints.openai.responses.streaming_events.emit_mcp_completion_events", "vllm.entrypoints.openai.responses.streaming_events.emit_mcp_delta_events", "vllm.entrypoints.openai.responses.streaming_events.emit_previous_item_done_events", "vllm.entrypoints.openai.responses.streaming_events.emit_reasoning_delta_events", "vllm.entrypoints.openai.responses.streaming_events.emit_reasoning_done_events", "vllm.entrypoints.openai.responses.streaming_events.emit_text_delta_events", "vllm.entrypoints.openai.responses.streaming_events.emit_text_output_done_events", "vllm.entrypoints.openai.responses.streaming_events.emit_tool_action_events", "vllm.entrypoints.openai.responses.streaming_events.is_mcp_tool_by_namespace" ], "n_typable": 51, "n_typed": 51, "n_any": 0, "n_untyped": 0, "n_functions": 15, "n_function_overloads": 15, "n_function_params": 34, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_classes": 1, "n_attrs": 7, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/openai/responses/utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.entrypoints.openai.responses.utils.construct_tool_dicts", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.entrypoints.openai.responses.utils.convert_tool_responses_to_completions_format", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.responses.utils.construct_input_messages", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.entrypoints.openai.responses.utils.should_continue_final_message", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.responses.utils.extract_tool_types", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.responses.utils.construct_chat_messages_with_tool_call", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.openai.responses.utils", "names": [ "vllm.entrypoints.openai.responses.utils.construct_chat_messages_with_tool_call", "vllm.entrypoints.openai.responses.utils.construct_input_messages", "vllm.entrypoints.openai.responses.utils.construct_tool_dicts", "vllm.entrypoints.openai.responses.utils.convert_tool_responses_to_completions_format", "vllm.entrypoints.openai.responses.utils.extract_tool_types", "vllm.entrypoints.openai.responses.utils.should_continue_final_message" ], "n_typable": 16, "n_typed": 15, "n_any": 0, "n_untyped": 1, "n_functions": 6, "n_function_overloads": 6, "n_function_params": 10, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/openai/run_batch.py", "symbol_reports": [ { "kind": "function", "name": "vllm.entrypoints.openai.run_batch.make_transcription_wrapper", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.run_batch.parse_args", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.entrypoints.openai.run_batch.args", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.entrypoints.openai.run_batch.BatchResponseData", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "BatchResponseData.status_code", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BatchResponseData.request_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BatchResponseData.body", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.entrypoints.openai.run_batch.WrapperFn", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.entrypoints.openai.run_batch.BatchRequestOutput", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "BatchRequestOutput.id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BatchRequestOutput.custom_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BatchRequestOutput.response", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BatchRequestOutput.error", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "function", "name": "vllm.entrypoints.openai.run_batch.handle_endpoint_request", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.entrypoints.openai.run_batch.make_async_error_request_output", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.entrypoints.openai.run_batch.build_endpoint_registry", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.entrypoints.openai.run_batch.BatchRequestInput", "methods": [ { "kind": "function", "name": "BatchRequestInput.check_type_for_url", "n_typed": 1, "n_any": 1, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BatchRequestInput.custom_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BatchRequestInput.method", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BatchRequestInput.url", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BatchRequestInput.body", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 7, "n_typed": 5, "n_any": 1, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 4, "n_properties": 0 }, { "kind": "function", "name": "vllm.entrypoints.openai.run_batch.download_bytes_from_url", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.entrypoints.openai.run_batch.BatchTranslationRequest", "methods": [ { "kind": "function", "name": "BatchTranslationRequest.validate_no_file", "n_typed": 0, "n_any": 1, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BatchTranslationRequest.file_url", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BatchTranslationRequest.file", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 2, "n_any": 1, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 2, "n_properties": 0 }, { "kind": "function", "name": "vllm.entrypoints.openai.run_batch.upload_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.entrypoints.openai.run_batch.BatchTranscriptionRequest", "methods": [ { "kind": "function", "name": "BatchTranscriptionRequest.validate_no_file", "n_typed": 0, "n_any": 1, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BatchTranscriptionRequest.file_url", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BatchTranscriptionRequest.file", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 2, "n_any": 1, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 2, "n_properties": 0 }, { "kind": "function", "name": "vllm.entrypoints.openai.run_batch.run_request", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.entrypoints.openai.run_batch.read_file", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.entrypoints.openai.run_batch.BatchProgressTracker", "methods": [ { "kind": "function", "name": "BatchProgressTracker.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BatchProgressTracker.submitted", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BatchProgressTracker.completed", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BatchProgressTracker.pbar", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.entrypoints.openai.run_batch.run_batch", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.entrypoints.openai.run_batch.make_arg_parser", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.run_batch.main", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.run_batch.write_local_file", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.entrypoints.openai.run_batch.validate_run_batch_args", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.entrypoints.openai.run_batch.BatchFrontendArgs", "methods": [ { "kind": "function", "name": "BatchFrontendArgs._customize_cli_kwargs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BatchFrontendArgs.input_file", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BatchFrontendArgs.output_file", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BatchFrontendArgs.output_tmp_dir", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BatchFrontendArgs.enable_metrics", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BatchFrontendArgs.host", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BatchFrontendArgs.port", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BatchFrontendArgs.url", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 9, "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 7, "n_properties": 0 }, { "kind": "function", "name": "vllm.entrypoints.openai.run_batch.make_error_request_output", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.entrypoints.openai.run_batch.write_file", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.entrypoints.openai.run_batch.BatchRequestInputBody", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.entrypoints.openai.run_batch.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [ { "kind": "type", "rules": [ "assignment" ] }, { "kind": "type", "rules": [ "assignment" ] } ], "name": "vllm.entrypoints.openai.run_batch", "names": [ "vllm.entrypoints.openai.run_batch.BatchFrontendArgs", "vllm.entrypoints.openai.run_batch.BatchProgressTracker", "vllm.entrypoints.openai.run_batch.BatchRequestInput", "vllm.entrypoints.openai.run_batch.BatchRequestInputBody", "vllm.entrypoints.openai.run_batch.BatchRequestOutput", "vllm.entrypoints.openai.run_batch.BatchResponseData", "vllm.entrypoints.openai.run_batch.BatchTranscriptionRequest", "vllm.entrypoints.openai.run_batch.BatchTranslationRequest", "vllm.entrypoints.openai.run_batch.WrapperFn", "vllm.entrypoints.openai.run_batch.args", "vllm.entrypoints.openai.run_batch.build_endpoint_registry", "vllm.entrypoints.openai.run_batch.download_bytes_from_url", "vllm.entrypoints.openai.run_batch.handle_endpoint_request", "vllm.entrypoints.openai.run_batch.logger", "vllm.entrypoints.openai.run_batch.main", "vllm.entrypoints.openai.run_batch.make_arg_parser", "vllm.entrypoints.openai.run_batch.make_async_error_request_output", "vllm.entrypoints.openai.run_batch.make_error_request_output", "vllm.entrypoints.openai.run_batch.make_transcription_wrapper", "vllm.entrypoints.openai.run_batch.parse_args", "vllm.entrypoints.openai.run_batch.read_file", "vllm.entrypoints.openai.run_batch.run_batch", "vllm.entrypoints.openai.run_batch.run_request", "vllm.entrypoints.openai.run_batch.upload_data", "vllm.entrypoints.openai.run_batch.validate_run_batch_args", "vllm.entrypoints.openai.run_batch.write_file", "vllm.entrypoints.openai.run_batch.write_local_file" ], "n_typable": 85, "n_typed": 69, "n_any": 3, "n_untyped": 13, "n_functions": 16, "n_function_overloads": 16, "n_function_params": 30, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 5, "n_classes": 7, "n_attrs": 26, "n_properties": 0, "n_type_ignores": 2 }, { "path": "vllm/entrypoints/openai/server_utils.py", "symbol_reports": [ { "kind": "class", "name": "vllm.entrypoints.openai.server_utils.SSEDecoder", "methods": [ { "kind": "function", "name": "SSEDecoder.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SSEDecoder.decode_chunk", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SSEDecoder.extract_content", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SSEDecoder.add_content", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SSEDecoder.get_complete_content", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SSEDecoder.buffer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SSEDecoder.content_buffer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 7, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 3, "n_attrs": 2, "n_properties": 0 }, { "kind": "function", "name": "vllm.entrypoints.openai.server_utils.validation_exception_handler", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.entrypoints.openai.server_utils.AuthenticationMiddleware", "methods": [ { "kind": "function", "name": "AuthenticationMiddleware.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AuthenticationMiddleware.verify_token", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AuthenticationMiddleware.__call__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AuthenticationMiddleware.app", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AuthenticationMiddleware.api_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 9, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_attrs": 2, "n_properties": 0 }, { "kind": "function", "name": "vllm.entrypoints.openai.server_utils.log_response", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.entrypoints.openai.server_utils.get_uvicorn_log_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.server_utils.http_exception_handler", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.entrypoints.openai.server_utils.lifespan", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.entrypoints.openai.server_utils.XRequestIdMiddleware", "methods": [ { "kind": "function", "name": "XRequestIdMiddleware.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "XRequestIdMiddleware.__call__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "XRequestIdMiddleware.app", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.entrypoints.openai.server_utils.load_log_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.entrypoints.openai.server_utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.openai.server_utils", "names": [ "vllm.entrypoints.openai.server_utils.AuthenticationMiddleware", "vllm.entrypoints.openai.server_utils.SSEDecoder", "vllm.entrypoints.openai.server_utils.XRequestIdMiddleware", "vllm.entrypoints.openai.server_utils.get_uvicorn_log_config", "vllm.entrypoints.openai.server_utils.http_exception_handler", "vllm.entrypoints.openai.server_utils.lifespan", "vllm.entrypoints.openai.server_utils.load_log_config", "vllm.entrypoints.openai.server_utils.log_response", "vllm.entrypoints.openai.server_utils.logger", "vllm.entrypoints.openai.server_utils.validation_exception_handler" ], "n_typable": 44, "n_typed": 32, "n_any": 0, "n_untyped": 12, "n_functions": 6, "n_function_overloads": 6, "n_function_params": 9, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 13, "n_classes": 3, "n_attrs": 6, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/openai/speech_to_text/api_router.py", "symbol_reports": [ { "kind": "function", "name": "vllm.entrypoints.openai.speech_to_text.api_router.create_translations", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.entrypoints.openai.speech_to_text.api_router.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.speech_to_text.api_router.translation", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.speech_to_text.api_router.init_transcription_state", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "attr", "name": "vllm.entrypoints.openai.speech_to_text.api_router.RequestLogger", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.entrypoints.openai.speech_to_text.api_router.attach_router", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.speech_to_text.api_router.transcription", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.openai.speech_to_text.api_router.create_transcriptions", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.entrypoints.openai.speech_to_text.api_router.router", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.openai.speech_to_text.api_router", "names": [ "vllm.entrypoints.openai.speech_to_text.api_router.RequestLogger", "vllm.entrypoints.openai.speech_to_text.api_router.attach_router", "vllm.entrypoints.openai.speech_to_text.api_router.create_transcriptions", "vllm.entrypoints.openai.speech_to_text.api_router.create_translations", "vllm.entrypoints.openai.speech_to_text.api_router.init_transcription_state", "vllm.entrypoints.openai.speech_to_text.api_router.logger", "vllm.entrypoints.openai.speech_to_text.api_router.router", "vllm.entrypoints.openai.speech_to_text.api_router.transcription", "vllm.entrypoints.openai.speech_to_text.api_router.translation" ], "n_typable": 20, "n_typed": 14, "n_any": 0, "n_untyped": 6, "n_functions": 6, "n_function_overloads": 6, "n_function_params": 12, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/openai/speech_to_text/protocol.py", "symbol_reports": [ { "kind": "class", "name": "vllm.entrypoints.openai.speech_to_text.protocol.TranslationResponse", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "TranslationResponse.text", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.speech_to_text.protocol.TranscriptionWord", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "TranscriptionWord.end", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionWord.start", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionWord.word", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.speech_to_text.protocol.TranscriptionResponse", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "TranscriptionResponse.text", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionResponse.usage", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.speech_to_text.protocol.TranslationResponseStreamChoice", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "TranslationResponseStreamChoice.delta", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranslationResponseStreamChoice.finish_reason", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranslationResponseStreamChoice.stop_reason", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.entrypoints.openai.speech_to_text.protocol.AudioResponseFormat", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.entrypoints.openai.speech_to_text.protocol.TranscriptionUsageAudio", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "TranscriptionUsageAudio.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionUsageAudio.seconds", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.speech_to_text.protocol.TranslationWord", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "TranslationWord.end", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranslationWord.start", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranslationWord.word", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.speech_to_text.protocol.TranscriptionStreamResponse", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "TranscriptionStreamResponse.id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionStreamResponse.object", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionStreamResponse.created", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionStreamResponse.model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionStreamResponse.choices", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionStreamResponse.usage", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.speech_to_text.protocol.TranslationSegment", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "TranslationSegment.id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranslationSegment.avg_logprob", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranslationSegment.compression_ratio", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranslationSegment.end", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranslationSegment.no_speech_prob", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranslationSegment.seek", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranslationSegment.start", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranslationSegment.temperature", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranslationSegment.text", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranslationSegment.tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 10, "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 10, "n_properties": 0 }, { "kind": "attr", "name": "vllm.entrypoints.openai.speech_to_text.protocol.TranslationResponseVariant", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.entrypoints.openai.speech_to_text.protocol.TranscriptionResponseVariant", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.entrypoints.openai.speech_to_text.protocol.TranscriptionRequest", "methods": [ { "kind": "function", "name": "TranscriptionRequest.to_sampling_params", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TranscriptionRequest.validate_transcription_request", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TranscriptionRequest.file", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionRequest.model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionRequest.language", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionRequest.prompt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionRequest.response_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionRequest.timestamp_granularities", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionRequest.stream", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionRequest.stream_include_usage", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionRequest.stream_continuous_usage_stats", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionRequest.vllm_xargs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionRequest.to_language", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionRequest.temperature", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionRequest.top_p", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionRequest.top_k", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionRequest.min_p", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionRequest.seed", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionRequest.frequency_penalty", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionRequest.repetition_penalty", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionRequest.presence_penalty", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionRequest.max_completion_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionRequest._DEFAULT_SAMPLING_PARAMS", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 26, "n_typed": 24, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 21, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.speech_to_text.protocol.TranslationStreamResponse", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "TranslationStreamResponse.id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranslationStreamResponse.object", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranslationStreamResponse.created", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranslationStreamResponse.model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranslationStreamResponse.choices", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranslationStreamResponse.usage", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.speech_to_text.protocol.TranslationResponseVerbose", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "TranslationResponseVerbose.duration", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranslationResponseVerbose.language", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranslationResponseVerbose.text", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranslationResponseVerbose.segments", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranslationResponseVerbose.words", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.speech_to_text.protocol.TranscriptionResponseVerbose", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "TranscriptionResponseVerbose.duration", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionResponseVerbose.language", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionResponseVerbose.text", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionResponseVerbose.segments", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionResponseVerbose.words", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.speech_to_text.protocol.TranslationRequest", "methods": [ { "kind": "function", "name": "TranslationRequest.to_sampling_params", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TranslationRequest.validate_stream_options", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TranslationRequest.file", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranslationRequest.model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranslationRequest.prompt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranslationRequest.response_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranslationRequest.seed", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranslationRequest.temperature", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranslationRequest.language", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranslationRequest.to_language", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranslationRequest.stream", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranslationRequest.stream_include_usage", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranslationRequest.stream_continuous_usage_stats", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranslationRequest.max_completion_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranslationRequest._DEFAULT_SAMPLING_PARAMS", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 18, "n_typed": 16, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 13, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.speech_to_text.protocol.TranscriptionSegment", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "TranscriptionSegment.id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionSegment.avg_logprob", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionSegment.compression_ratio", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionSegment.end", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionSegment.no_speech_prob", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionSegment.seek", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionSegment.start", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionSegment.temperature", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionSegment.text", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionSegment.tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 10, "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 10, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.speech_to_text.protocol.TranscriptionResponseStreamChoice", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "TranscriptionResponseStreamChoice.delta", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionResponseStreamChoice.finish_reason", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TranscriptionResponseStreamChoice.stop_reason", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.entrypoints.openai.speech_to_text.protocol.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.openai.speech_to_text.protocol", "names": [ "vllm.entrypoints.openai.speech_to_text.protocol.AudioResponseFormat", "vllm.entrypoints.openai.speech_to_text.protocol.TranscriptionRequest", "vllm.entrypoints.openai.speech_to_text.protocol.TranscriptionResponse", "vllm.entrypoints.openai.speech_to_text.protocol.TranscriptionResponseStreamChoice", "vllm.entrypoints.openai.speech_to_text.protocol.TranscriptionResponseVariant", "vllm.entrypoints.openai.speech_to_text.protocol.TranscriptionResponseVerbose", "vllm.entrypoints.openai.speech_to_text.protocol.TranscriptionSegment", "vllm.entrypoints.openai.speech_to_text.protocol.TranscriptionStreamResponse", "vllm.entrypoints.openai.speech_to_text.protocol.TranscriptionUsageAudio", "vllm.entrypoints.openai.speech_to_text.protocol.TranscriptionWord", "vllm.entrypoints.openai.speech_to_text.protocol.TranslationRequest", "vllm.entrypoints.openai.speech_to_text.protocol.TranslationResponse", "vllm.entrypoints.openai.speech_to_text.protocol.TranslationResponseStreamChoice", "vllm.entrypoints.openai.speech_to_text.protocol.TranslationResponseVariant", "vllm.entrypoints.openai.speech_to_text.protocol.TranslationResponseVerbose", "vllm.entrypoints.openai.speech_to_text.protocol.TranslationSegment", "vllm.entrypoints.openai.speech_to_text.protocol.TranslationStreamResponse", "vllm.entrypoints.openai.speech_to_text.protocol.TranslationWord", "vllm.entrypoints.openai.speech_to_text.protocol.logger" ], "n_typable": 107, "n_typed": 102, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 6, "n_classes": 15, "n_attrs": 97, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/openai/speech_to_text/serving.py", "symbol_reports": [ { "kind": "class", "name": "vllm.entrypoints.openai.speech_to_text.serving.OpenAIServingTranslation", "methods": [ { "kind": "function", "name": "OpenAIServingTranslation.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "OpenAIServingTranslation.create_translation", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "OpenAIServingTranslation.translation_stream_generator", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [], "n_typable": 17, "n_typed": 16, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 14, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.speech_to_text.serving.OpenAIServingTranscription", "methods": [ { "kind": "function", "name": "OpenAIServingTranscription.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "OpenAIServingTranscription.create_transcription", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "OpenAIServingTranscription.transcription_stream_generator", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [], "n_typable": 17, "n_typed": 16, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 14, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.entrypoints.openai.speech_to_text.serving.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.openai.speech_to_text.serving", "names": [ "vllm.entrypoints.openai.speech_to_text.serving.OpenAIServingTranscription", "vllm.entrypoints.openai.speech_to_text.serving.OpenAIServingTranslation", "vllm.entrypoints.openai.speech_to_text.serving.logger" ], "n_typable": 35, "n_typed": 32, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 28, "n_classes": 2, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/openai/speech_to_text/speech_to_text.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.openai.speech_to_text.speech_to_text.SpeechToTextSegment", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.entrypoints.openai.speech_to_text.speech_to_text.SpeechToTextResponse", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.entrypoints.openai.speech_to_text.speech_to_text.S", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.entrypoints.openai.speech_to_text.speech_to_text.ResponseType", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.entrypoints.openai.speech_to_text.speech_to_text.T", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.entrypoints.openai.speech_to_text.speech_to_text.V", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.entrypoints.openai.speech_to_text.speech_to_text.OpenAISpeechToText", "methods": [ { "kind": "function", "name": "OpenAISpeechToText.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "OpenAISpeechToText._warmup_audio_preprocessing", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "OpenAISpeechToText._warmup_input_processor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "OpenAISpeechToText._detect_language", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OpenAISpeechToText._preprocess_speech_to_text", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "OpenAISpeechToText._preprocess_verbose_prompt", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenAISpeechToText._get_verbose_segments", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "OpenAISpeechToText._create_speech_to_text", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "OpenAISpeechToText._speech_to_text_stream_generator", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 } ], "properties": [ { "kind": "property", "name": "OpenAISpeechToText.model_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "OpenAISpeechToText.default_sampling_params", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAISpeechToText.task_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "OpenAISpeechToText.asr_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAISpeechToText.enable_force_include_usage", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAISpeechToText.max_audio_filesize_mb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAISpeechToText.tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 47, "n_typed": 40, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 31, "n_attrs": 6, "n_properties": 1 }, { "kind": "attr", "name": "vllm.entrypoints.openai.speech_to_text.speech_to_text.SpeechToTextResponseVerbose", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.entrypoints.openai.speech_to_text.speech_to_text.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.entrypoints.openai.speech_to_text.speech_to_text.librosa", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [ { "kind": "type", "rules": [ "assignment" ] } ], "name": "vllm.entrypoints.openai.speech_to_text.speech_to_text", "names": [ "vllm.entrypoints.openai.speech_to_text.speech_to_text.OpenAISpeechToText", "vllm.entrypoints.openai.speech_to_text.speech_to_text.ResponseType", "vllm.entrypoints.openai.speech_to_text.speech_to_text.S", "vllm.entrypoints.openai.speech_to_text.speech_to_text.SpeechToTextResponse", "vllm.entrypoints.openai.speech_to_text.speech_to_text.SpeechToTextResponseVerbose", "vllm.entrypoints.openai.speech_to_text.speech_to_text.SpeechToTextSegment", "vllm.entrypoints.openai.speech_to_text.speech_to_text.T", "vllm.entrypoints.openai.speech_to_text.speech_to_text.V", "vllm.entrypoints.openai.speech_to_text.speech_to_text.librosa", "vllm.entrypoints.openai.speech_to_text.speech_to_text.logger" ], "n_typable": 53, "n_typed": 44, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 31, "n_classes": 1, "n_attrs": 15, "n_properties": 1, "n_type_ignores": 1 }, { "path": "vllm/entrypoints/openai/utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.entrypoints.openai.utils.maybe_filter_parallel_tool_calls", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.entrypoints.openai.utils.validate_json_request", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.openai.utils", "names": [ "vllm.entrypoints.openai.utils.maybe_filter_parallel_tool_calls", "vllm.entrypoints.openai.utils.validate_json_request" ], "n_typable": 5, "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 3, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/pooling/__init__.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.pooling.RequestLogger", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.entrypoints.pooling.init_pooling_state", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.entrypoints.pooling.register_pooling_api_routers", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.entrypoints.pooling.SupportedTask", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.pooling", "names": [ "vllm.entrypoints.pooling.RequestLogger", "vllm.entrypoints.pooling.SupportedTask", "vllm.entrypoints.pooling.init_pooling_state", "vllm.entrypoints.pooling.register_pooling_api_routers" ], "n_typable": 9, "n_typed": 7, "n_any": 0, "n_untyped": 2, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 7, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/pooling/base/io_processor.py", "symbol_reports": [ { "kind": "class", "name": "vllm.entrypoints.pooling.base.io_processor.PoolingIOProcessor", "methods": [ { "kind": "function", "name": "PoolingIOProcessor.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "PoolingIOProcessor.pre_process_online", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PoolingIOProcessor.pre_process_online_async", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PoolingIOProcessor.pre_process_offline", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PoolingIOProcessor.pre_process_offline_async", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PoolingIOProcessor.post_process", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PoolingIOProcessor.post_process_async", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PoolingIOProcessor.create_pooling_params", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PoolingIOProcessor._preprocess_completion_online", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "PoolingIOProcessor._preprocess_chat_online", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "PoolingIOProcessor._preprocess_completion_offline", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PoolingIOProcessor._validate_chat_template", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PoolingIOProcessor.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PoolingIOProcessor.renderer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PoolingIOProcessor.chat_template", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PoolingIOProcessor.chat_template_content_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PoolingIOProcessor.trust_request_chat_template", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 46, "n_typed": 26, "n_any": 0, "n_untyped": 20, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 29, "n_attrs": 5, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.pooling.base.io_processor", "names": [ "vllm.entrypoints.pooling.base.io_processor.PoolingIOProcessor" ], "n_typable": 46, "n_typed": 26, "n_any": 0, "n_untyped": 20, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 29, "n_classes": 1, "n_attrs": 5, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/pooling/base/protocol.py", "symbol_reports": [ { "kind": "class", "name": "vllm.entrypoints.pooling.base.protocol.PoolingBasicRequestMixin", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "PoolingBasicRequestMixin.model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PoolingBasicRequestMixin.user", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PoolingBasicRequestMixin.truncate_prompt_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PoolingBasicRequestMixin.request_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PoolingBasicRequestMixin.priority", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PoolingBasicRequestMixin.mm_processor_kwargs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PoolingBasicRequestMixin.cache_salt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.pooling.base.protocol.EncodingRequestMixin", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "EncodingRequestMixin.encoding_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EncodingRequestMixin.embed_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EncodingRequestMixin.endianness", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.pooling.base.protocol.CompletionRequestMixin", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "CompletionRequestMixin.input", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompletionRequestMixin.add_special_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.pooling.base.protocol.ClassifyRequestMixin", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ClassifyRequestMixin.use_activation", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.pooling.base.protocol.EmbedRequestMixin", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "EmbedRequestMixin.dimensions", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EmbedRequestMixin.use_activation", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.pooling.base.protocol.ChatRequestMixin", "methods": [ { "kind": "function", "name": "ChatRequestMixin.check_generation_prompt", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ChatRequestMixin.build_chat_params", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ChatRequestMixin.messages", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatRequestMixin.add_generation_prompt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatRequestMixin.continue_final_message", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatRequestMixin.add_special_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatRequestMixin.chat_template", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChatRequestMixin.chat_template_kwargs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 11, "n_typed": 9, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.pooling.base.protocol", "names": [ "vllm.entrypoints.pooling.base.protocol.ChatRequestMixin", "vllm.entrypoints.pooling.base.protocol.ClassifyRequestMixin", "vllm.entrypoints.pooling.base.protocol.CompletionRequestMixin", "vllm.entrypoints.pooling.base.protocol.EmbedRequestMixin", "vllm.entrypoints.pooling.base.protocol.EncodingRequestMixin", "vllm.entrypoints.pooling.base.protocol.PoolingBasicRequestMixin" ], "n_typable": 26, "n_typed": 24, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_classes": 6, "n_attrs": 21, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/pooling/base/serving.py", "symbol_reports": [ { "kind": "class", "name": "vllm.entrypoints.pooling.base.serving.PoolingServeContext", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "PoolingServeContext.request", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PoolingServeContext.raw_request", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PoolingServeContext.model_name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PoolingServeContext.request_id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PoolingServeContext.created_time", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PoolingServeContext.lora_request", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PoolingServeContext.engine_prompts", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PoolingServeContext.result_generator", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PoolingServeContext.final_res_batch", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PoolingServeContext.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 10, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.pooling.base.serving.PoolingServing", "methods": [ { "kind": "function", "name": "PoolingServing.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "PoolingServing.init_io_processor", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "PoolingServing.__call__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PoolingServing._preprocess", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PoolingServing._prepare_generators", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PoolingServing._collect_batch", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PoolingServing._build_response", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PoolingServing._base_request_id", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PoolingServing._is_model_supported", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PoolingServing._check_model", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PoolingServing._validate_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PoolingServing._get_trace_headers", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PoolingServing._maybe_get_adapters", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PoolingServing._get_active_default_mm_loras", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PoolingServing._get_message_types", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PoolingServing._log_inputs", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PoolingServing.request_id_prefix", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PoolingServing.engine_client", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PoolingServing.models", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PoolingServing.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PoolingServing.max_model_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PoolingServing.request_logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PoolingServing.return_tokens_as_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PoolingServing.log_error_stack", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PoolingServing.chat_template_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PoolingServing.io_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 57, "n_typed": 43, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 16, "n_method_overloads": 16, "n_method_params": 31, "n_attrs": 10, "n_properties": 0 }, { "kind": "attr", "name": "vllm.entrypoints.pooling.base.serving.PoolingRequestT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.pooling.base.serving", "names": [ "vllm.entrypoints.pooling.base.serving.PoolingRequestT", "vllm.entrypoints.pooling.base.serving.PoolingServeContext", "vllm.entrypoints.pooling.base.serving.PoolingServing" ], "n_typable": 58, "n_typed": 43, "n_any": 0, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 16, "n_method_overloads": 16, "n_method_params": 31, "n_classes": 2, "n_attrs": 21, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/pooling/classify/api_router.py", "symbol_reports": [ { "kind": "function", "name": "vllm.entrypoints.pooling.classify.api_router.classify", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.entrypoints.pooling.classify.api_router.router", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.pooling.classify.api_router.create_classify", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.entrypoints.pooling.classify.api_router", "names": [ "vllm.entrypoints.pooling.classify.api_router.classify", "vllm.entrypoints.pooling.classify.api_router.create_classify", "vllm.entrypoints.pooling.classify.api_router.router" ], "n_typable": 6, "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 3, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/pooling/classify/io_processor.py", "symbol_reports": [ { "kind": "class", "name": "vllm.entrypoints.pooling.classify.io_processor.ClassifyIOProcessor", "methods": [ { "kind": "function", "name": "ClassifyIOProcessor.pre_process_online", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ClassifyIOProcessor.pre_process_offline", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.pooling.classify.io_processor", "names": [ "vllm.entrypoints.pooling.classify.io_processor.ClassifyIOProcessor" ], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/pooling/classify/protocol.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.pooling.classify.protocol.ClassificationRequest", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.entrypoints.pooling.classify.protocol.ClassificationResponse", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ClassificationResponse.id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ClassificationResponse.object", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ClassificationResponse.created", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ClassificationResponse.model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ClassificationResponse.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ClassificationResponse.usage", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.pooling.classify.protocol.ClassificationChatRequest", "methods": [ { "kind": "function", "name": "ClassificationChatRequest.build_tok_params", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ClassificationChatRequest.to_pooling_params", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.pooling.classify.protocol.ClassificationCompletionRequest", "methods": [ { "kind": "function", "name": "ClassificationCompletionRequest.build_tok_params", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ClassificationCompletionRequest.to_pooling_params", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.pooling.classify.protocol.ClassificationData", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ClassificationData.index", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ClassificationData.label", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ClassificationData.probs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ClassificationData.num_classes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "attr", "name": "vllm.entrypoints.pooling.classify.protocol.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.pooling.classify.protocol", "names": [ "vllm.entrypoints.pooling.classify.protocol.ClassificationChatRequest", "vllm.entrypoints.pooling.classify.protocol.ClassificationCompletionRequest", "vllm.entrypoints.pooling.classify.protocol.ClassificationData", "vllm.entrypoints.pooling.classify.protocol.ClassificationRequest", "vllm.entrypoints.pooling.classify.protocol.ClassificationResponse", "vllm.entrypoints.pooling.classify.protocol.logger" ], "n_typable": 18, "n_typed": 15, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 2, "n_classes": 4, "n_attrs": 12, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/pooling/classify/serving.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.pooling.classify.serving.ClassificationServeContext", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.entrypoints.pooling.classify.serving.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.entrypoints.pooling.classify.serving.ServingClassification", "methods": [ { "kind": "function", "name": "ServingClassification.init_io_processor", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ServingClassification._build_response", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ServingClassification.request_id_prefix", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.pooling.classify.serving", "names": [ "vllm.entrypoints.pooling.classify.serving.ClassificationServeContext", "vllm.entrypoints.pooling.classify.serving.ServingClassification", "vllm.entrypoints.pooling.classify.serving.logger" ], "n_typable": 8, "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_classes": 1, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/pooling/embed/api_router.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.pooling.embed.api_router.router", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.pooling.embed.api_router.embedding", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.entrypoints.pooling.embed.api_router.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.pooling.embed.api_router.create_embedding", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.entrypoints.pooling.embed.api_router", "names": [ "vllm.entrypoints.pooling.embed.api_router.create_embedding", "vllm.entrypoints.pooling.embed.api_router.embedding", "vllm.entrypoints.pooling.embed.api_router.logger", "vllm.entrypoints.pooling.embed.api_router.router" ], "n_typable": 7, "n_typed": 4, "n_any": 0, "n_untyped": 3, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 3, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/pooling/embed/protocol.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.pooling.embed.protocol.EmbeddingRequest", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.entrypoints.pooling.embed.protocol.EmbeddingCompletionRequest", "methods": [ { "kind": "function", "name": "EmbeddingCompletionRequest.build_tok_params", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EmbeddingCompletionRequest.to_pooling_params", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.pooling.embed.protocol.EmbeddingBytesResponse", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "EmbeddingBytesResponse.content", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EmbeddingBytesResponse.headers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EmbeddingBytesResponse.media_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.pooling.embed.protocol.EmbeddingChatRequest", "methods": [ { "kind": "function", "name": "EmbeddingChatRequest.build_tok_params", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EmbeddingChatRequest.to_pooling_params", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.pooling.embed.protocol.EmbeddingResponse", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "EmbeddingResponse.id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EmbeddingResponse.object", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EmbeddingResponse.created", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EmbeddingResponse.model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EmbeddingResponse.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EmbeddingResponse.usage", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.pooling.embed.protocol.EmbeddingResponseData", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "EmbeddingResponseData.index", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EmbeddingResponseData.object", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EmbeddingResponseData.embedding", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.pooling.embed.protocol", "names": [ "vllm.entrypoints.pooling.embed.protocol.EmbeddingBytesResponse", "vllm.entrypoints.pooling.embed.protocol.EmbeddingChatRequest", "vllm.entrypoints.pooling.embed.protocol.EmbeddingCompletionRequest", "vllm.entrypoints.pooling.embed.protocol.EmbeddingRequest", "vllm.entrypoints.pooling.embed.protocol.EmbeddingResponse", "vllm.entrypoints.pooling.embed.protocol.EmbeddingResponseData" ], "n_typable": 19, "n_typed": 17, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 2, "n_classes": 5, "n_attrs": 13, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/pooling/embed/serving.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.pooling.embed.serving.EmbeddingServeContext", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.entrypoints.pooling.embed.serving.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.entrypoints.pooling.embed.serving.OpenAIServingEmbedding", "methods": [ { "kind": "function", "name": "OpenAIServingEmbedding.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "OpenAIServingEmbedding._preprocess", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenAIServingEmbedding.request_output_to_embed_json_response", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "OpenAIServingEmbedding.request_output_to_embed_bytes_response", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "OpenAIServingEmbedding._build_response", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenAIServingEmbedding._get_max_position_embeddings", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "OpenAIServingEmbedding._should_use_chunked_processing", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenAIServingEmbedding._process_chunked_request", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "OpenAIServingEmbedding._validate_input", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "OpenAIServingEmbedding._create_single_prompt_generator", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "OpenAIServingEmbedding._prepare_generators", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenAIServingEmbedding._collect_batch", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenAIServingEmbedding.create_embedding", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OpenAIServingEmbedding.request_id_prefix", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "OpenAIServingEmbedding.chat_template", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingEmbedding.chat_template_content_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingEmbedding.trust_request_chat_template", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingEmbedding.pooler_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 58, "n_typed": 54, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 41, "n_attrs": 5, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.pooling.embed.serving", "names": [ "vllm.entrypoints.pooling.embed.serving.EmbeddingServeContext", "vllm.entrypoints.pooling.embed.serving.OpenAIServingEmbedding", "vllm.entrypoints.pooling.embed.serving.logger" ], "n_typable": 60, "n_typed": 55, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 41, "n_classes": 1, "n_attrs": 7, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/pooling/io_processor_factories.py", "symbol_reports": [ { "kind": "function", "name": "vllm.entrypoints.pooling.io_processor_factories.init_pooling_io_processors", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "type_ignores": [], "name": "vllm.entrypoints.pooling.io_processor_factories", "names": [ "vllm.entrypoints.pooling.io_processor_factories.init_pooling_io_processors" ], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 4, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/pooling/pooling/api_router.py", "symbol_reports": [ { "kind": "function", "name": "vllm.entrypoints.pooling.pooling.api_router.pooling", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.pooling.pooling.api_router.create_pooling", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.entrypoints.pooling.pooling.api_router.router", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.pooling.pooling.api_router", "names": [ "vllm.entrypoints.pooling.pooling.api_router.create_pooling", "vllm.entrypoints.pooling.pooling.api_router.pooling", "vllm.entrypoints.pooling.pooling.api_router.router" ], "n_typable": 6, "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 3, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/pooling/pooling/protocol.py", "symbol_reports": [ { "kind": "class", "name": "vllm.entrypoints.pooling.pooling.protocol.IOProcessorRequest", "methods": [ { "kind": "function", "name": "IOProcessorRequest.build_tok_params", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "IOProcessorRequest.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "IOProcessorRequest.task", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.pooling.pooling.protocol.PoolingBytesResponse", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "PoolingBytesResponse.content", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PoolingBytesResponse.headers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PoolingBytesResponse.media_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.pooling.pooling.protocol.PoolingChatRequest", "methods": [ { "kind": "function", "name": "PoolingChatRequest.build_tok_params", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PoolingChatRequest.to_pooling_params", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PoolingChatRequest.task", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.pooling.pooling.protocol.PoolingCompletionRequest", "methods": [ { "kind": "function", "name": "PoolingCompletionRequest.build_tok_params", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PoolingCompletionRequest.to_pooling_params", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PoolingCompletionRequest.task", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.entrypoints.pooling.pooling.protocol.T", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.entrypoints.pooling.pooling.protocol.PoolingResponse", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "PoolingResponse.id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PoolingResponse.object", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PoolingResponse.created", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PoolingResponse.model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PoolingResponse.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PoolingResponse.usage", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.pooling.pooling.protocol.PoolingResponseData", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "PoolingResponseData.index", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PoolingResponseData.object", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PoolingResponseData.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.pooling.pooling.protocol.IOProcessorResponse", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "IOProcessorResponse.request_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "IOProcessorResponse.created_at", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "IOProcessorResponse.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.entrypoints.pooling.pooling.protocol.PoolingRequest", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.pooling.pooling.protocol", "names": [ "vllm.entrypoints.pooling.pooling.protocol.IOProcessorRequest", "vllm.entrypoints.pooling.pooling.protocol.IOProcessorResponse", "vllm.entrypoints.pooling.pooling.protocol.PoolingBytesResponse", "vllm.entrypoints.pooling.pooling.protocol.PoolingChatRequest", "vllm.entrypoints.pooling.pooling.protocol.PoolingCompletionRequest", "vllm.entrypoints.pooling.pooling.protocol.PoolingRequest", "vllm.entrypoints.pooling.pooling.protocol.PoolingResponse", "vllm.entrypoints.pooling.pooling.protocol.PoolingResponseData", "vllm.entrypoints.pooling.pooling.protocol.T" ], "n_typable": 28, "n_typed": 26, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 3, "n_classes": 7, "n_attrs": 21, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/pooling/pooling/serving.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.pooling.pooling.serving.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.entrypoints.pooling.pooling.serving.OpenAIServingPooling", "methods": [ { "kind": "function", "name": "OpenAIServingPooling.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "OpenAIServingPooling.create_pooling", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OpenAIServingPooling.request_output_to_pooling_json_response", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "OpenAIServingPooling.request_output_to_pooling_bytes_response", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "OpenAIServingPooling.request_output_to_pooling_response", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OpenAIServingPooling.chat_template", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingPooling.chat_template_content_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingPooling.trust_request_chat_template", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 38, "n_typed": 36, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 30, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.pooling.pooling.serving", "names": [ "vllm.entrypoints.pooling.pooling.serving.OpenAIServingPooling", "vllm.entrypoints.pooling.pooling.serving.logger" ], "n_typable": 39, "n_typed": 36, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 30, "n_classes": 1, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/pooling/score/api_router.py", "symbol_reports": [ { "kind": "function", "name": "vllm.entrypoints.pooling.score.api_router.do_rerank", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.entrypoints.pooling.score.api_router.create_score_v1", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.entrypoints.pooling.score.api_router.router", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.pooling.score.api_router.create_score", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.entrypoints.pooling.score.api_router.do_rerank_v1", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.entrypoints.pooling.score.api_router.score", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.pooling.score.api_router.do_rerank_v2", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.entrypoints.pooling.score.api_router.rerank", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.entrypoints.pooling.score.api_router.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.pooling.score.api_router", "names": [ "vllm.entrypoints.pooling.score.api_router.create_score", "vllm.entrypoints.pooling.score.api_router.create_score_v1", "vllm.entrypoints.pooling.score.api_router.do_rerank", "vllm.entrypoints.pooling.score.api_router.do_rerank_v1", "vllm.entrypoints.pooling.score.api_router.do_rerank_v2", "vllm.entrypoints.pooling.score.api_router.logger", "vllm.entrypoints.pooling.score.api_router.rerank", "vllm.entrypoints.pooling.score.api_router.router", "vllm.entrypoints.pooling.score.api_router.score" ], "n_typable": 21, "n_typed": 14, "n_any": 0, "n_untyped": 7, "n_functions": 7, "n_function_overloads": 7, "n_function_params": 12, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/pooling/score/protocol.py", "symbol_reports": [ { "kind": "class", "name": "vllm.entrypoints.pooling.score.protocol.ScoreResponseData", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ScoreResponseData.index", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ScoreResponseData.object", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ScoreResponseData.score", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.pooling.score.protocol.RerankRequest", "methods": [ { "kind": "function", "name": "RerankRequest.build_tok_params", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RerankRequest.to_pooling_params", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RerankRequest.query", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "RerankRequest.documents", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "RerankRequest.top_n", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 7, "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.pooling.score.protocol.ScoreTextRequest", "methods": [], "properties": [ { "kind": "property", "name": "ScoreTextRequest.data_1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "ScoreTextRequest.data_2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "ScoreTextRequest.text_1", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ScoreTextRequest.text_2", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 2 }, { "kind": "class", "name": "vllm.entrypoints.pooling.score.protocol.RerankDocument", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "RerankDocument.text", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "RerankDocument.multi_modal", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.pooling.score.protocol.RerankUsage", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "RerankUsage.prompt_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "RerankUsage.total_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.pooling.score.protocol.ScoreQueriesItemsRequest", "methods": [], "properties": [ { "kind": "property", "name": "ScoreQueriesItemsRequest.data_1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "ScoreQueriesItemsRequest.data_2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "ScoreQueriesItemsRequest.queries", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ScoreQueriesItemsRequest.items", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 2 }, { "kind": "attr", "name": "vllm.entrypoints.pooling.score.protocol.ScoreRequest", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.entrypoints.pooling.score.protocol.ScoreDataRequest", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ScoreDataRequest.data_1", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ScoreDataRequest.data_2", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.pooling.score.protocol.ScoreResponse", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ScoreResponse.id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ScoreResponse.object", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ScoreResponse.created", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ScoreResponse.model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ScoreResponse.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ScoreResponse.usage", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.pooling.score.protocol.ScoreRequestMixin", "methods": [ { "kind": "function", "name": "ScoreRequestMixin.build_tok_params", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ScoreRequestMixin.to_pooling_params", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.pooling.score.protocol.ScoreQueriesDocumentsRequest", "methods": [], "properties": [ { "kind": "property", "name": "ScoreQueriesDocumentsRequest.data_1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "ScoreQueriesDocumentsRequest.data_2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "ScoreQueriesDocumentsRequest.queries", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ScoreQueriesDocumentsRequest.documents", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 2 }, { "kind": "class", "name": "vllm.entrypoints.pooling.score.protocol.RerankResponse", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "RerankResponse.id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "RerankResponse.model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "RerankResponse.usage", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "RerankResponse.results", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.pooling.score.protocol.RerankResult", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "RerankResult.index", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "RerankResult.document", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "RerankResult.relevance_score", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.pooling.score.protocol", "names": [ "vllm.entrypoints.pooling.score.protocol.RerankDocument", "vllm.entrypoints.pooling.score.protocol.RerankRequest", "vllm.entrypoints.pooling.score.protocol.RerankResponse", "vllm.entrypoints.pooling.score.protocol.RerankResult", "vllm.entrypoints.pooling.score.protocol.RerankUsage", "vllm.entrypoints.pooling.score.protocol.ScoreDataRequest", "vllm.entrypoints.pooling.score.protocol.ScoreQueriesDocumentsRequest", "vllm.entrypoints.pooling.score.protocol.ScoreQueriesItemsRequest", "vllm.entrypoints.pooling.score.protocol.ScoreRequest", "vllm.entrypoints.pooling.score.protocol.ScoreRequestMixin", "vllm.entrypoints.pooling.score.protocol.ScoreResponse", "vllm.entrypoints.pooling.score.protocol.ScoreResponseData", "vllm.entrypoints.pooling.score.protocol.ScoreTextRequest" ], "n_typable": 46, "n_typed": 38, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 4, "n_classes": 12, "n_attrs": 32, "n_properties": 6, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/pooling/score/serving.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.pooling.score.serving.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.entrypoints.pooling.score.serving.ServingScores", "methods": [ { "kind": "function", "name": "ServingScores.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "ServingScores._embedding_score", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "ServingScores._preprocess_late_interaction_item", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "ServingScores._late_interaction_score", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "ServingScores._cross_encoding_score", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "ServingScores._preprocess_score", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "ServingScores._run_scoring", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "ServingScores.create_score", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ServingScores.do_rerank", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ServingScores.request_output_to_score_response", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ServingScores.request_output_to_rerank_response", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ServingScores.score_template", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ServingScores.use_gpu_for_pooling_score", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ServingScores.is_cross_encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ServingScores.is_multimodal_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ServingScores.architecture", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ServingScores.is_late_interaction", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 69, "n_typed": 63, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 52, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.pooling.score.serving", "names": [ "vllm.entrypoints.pooling.score.serving.ServingScores", "vllm.entrypoints.pooling.score.serving.logger" ], "n_typable": 70, "n_typed": 63, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 52, "n_classes": 1, "n_attrs": 7, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/pooling/score/utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.entrypoints.pooling.score.utils.get_score_prompt", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "class", "name": "vllm.entrypoints.pooling.score.utils.ScoreMultiModalParam", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ScoreMultiModalParam.content", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.entrypoints.pooling.score.utils.parse_score_data_single", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.entrypoints.pooling.score.utils.ScoreInputs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.entrypoints.pooling.score.utils.score_data_to_prompts", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.entrypoints.pooling.score.utils.ScoreData", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.entrypoints.pooling.score.utils.post_process_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.entrypoints.pooling.score.utils.parse_score_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.entrypoints.pooling.score.utils.compute_maxsim_scores", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.entrypoints.pooling.score.utils.compress_token_type_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.entrypoints.pooling.score.utils.ScoreInput", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.entrypoints.pooling.score.utils.compute_maxsim_score", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.entrypoints.pooling.score.utils.ScoreContentPartParam", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.pooling.score.utils.validate_score_input", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "type_ignores": [], "name": "vllm.entrypoints.pooling.score.utils", "names": [ "vllm.entrypoints.pooling.score.utils.ScoreContentPartParam", "vllm.entrypoints.pooling.score.utils.ScoreData", "vllm.entrypoints.pooling.score.utils.ScoreInput", "vllm.entrypoints.pooling.score.utils.ScoreInputs", "vllm.entrypoints.pooling.score.utils.ScoreMultiModalParam", "vllm.entrypoints.pooling.score.utils.compress_token_type_ids", "vllm.entrypoints.pooling.score.utils.compute_maxsim_score", "vllm.entrypoints.pooling.score.utils.compute_maxsim_scores", "vllm.entrypoints.pooling.score.utils.get_score_prompt", "vllm.entrypoints.pooling.score.utils.parse_score_data", "vllm.entrypoints.pooling.score.utils.parse_score_data_single", "vllm.entrypoints.pooling.score.utils.post_process_tokens", "vllm.entrypoints.pooling.score.utils.score_data_to_prompts", "vllm.entrypoints.pooling.score.utils.validate_score_input" ], "n_typable": 39, "n_typed": 39, "n_any": 0, "n_untyped": 0, "n_functions": 9, "n_function_overloads": 9, "n_function_params": 29, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 1, "n_attrs": 5, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/pooling/typing.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.pooling.typing.PoolingChatLikeRequest", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.entrypoints.pooling.typing.AnyPoolingRequest", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.entrypoints.pooling.typing.AnyPoolingResponse", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.entrypoints.pooling.typing.PoolingCompletionLikeRequest", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.pooling.typing", "names": [ "vllm.entrypoints.pooling.typing.AnyPoolingRequest", "vllm.entrypoints.pooling.typing.AnyPoolingResponse", "vllm.entrypoints.pooling.typing.PoolingChatLikeRequest", "vllm.entrypoints.pooling.typing.PoolingCompletionLikeRequest" ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/pooling/utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.entrypoints.pooling.utils.encode_pooling_output_binary", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.entrypoints.pooling.utils.build_metadata_items", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.entrypoints.pooling.utils.encode_pooling_output_base64", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.entrypoints.pooling.utils.MetadataItem", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "MetadataItem.index", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MetadataItem.embed_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MetadataItem.endianness", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MetadataItem.start", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MetadataItem.end", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MetadataItem.shape", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 6, "n_properties": 0 }, { "kind": "function", "name": "vllm.entrypoints.pooling.utils.encode_pooling_output_float", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.pooling.utils.decode_pooling_output", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.entrypoints.pooling.utils.encode_pooling_bytes", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [], "name": "vllm.entrypoints.pooling.utils", "names": [ "vllm.entrypoints.pooling.utils.MetadataItem", "vllm.entrypoints.pooling.utils.build_metadata_items", "vllm.entrypoints.pooling.utils.decode_pooling_output", "vllm.entrypoints.pooling.utils.encode_pooling_bytes", "vllm.entrypoints.pooling.utils.encode_pooling_output_base64", "vllm.entrypoints.pooling.utils.encode_pooling_output_binary", "vllm.entrypoints.pooling.utils.encode_pooling_output_float" ], "n_typable": 22, "n_typed": 22, "n_any": 0, "n_untyped": 0, "n_functions": 6, "n_function_overloads": 6, "n_function_params": 16, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 1, "n_attrs": 6, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/sagemaker/api_router.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.sagemaker.api_router.EndpointFn", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.sagemaker.api_router.get_invocation_types", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.sagemaker.api_router.attach_router", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.entrypoints.sagemaker.api_router.GetHandlerFn", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.sagemaker.api_router.sagemaker_standards_bootstrap", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.sagemaker.api_router", "names": [ "vllm.entrypoints.sagemaker.api_router.EndpointFn", "vllm.entrypoints.sagemaker.api_router.GetHandlerFn", "vllm.entrypoints.sagemaker.api_router.attach_router", "vllm.entrypoints.sagemaker.api_router.get_invocation_types", "vllm.entrypoints.sagemaker.api_router.sagemaker_standards_bootstrap" ], "n_typable": 9, "n_typed": 7, "n_any": 0, "n_untyped": 2, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 4, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/serve/__init__.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.serve.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.register_vllm_serve_api_routers", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.serve", "names": [ "vllm.entrypoints.serve.logger", "vllm.entrypoints.serve.register_vllm_serve_api_routers" ], "n_typable": 3, "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/serve/cache/api_router.py", "symbol_reports": [ { "kind": "function", "name": "vllm.entrypoints.serve.cache.api_router.reset_mm_cache", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.entrypoints.serve.cache.api_router.router", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.cache.api_router.reset_prefix_cache", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.entrypoints.serve.cache.api_router.engine_client", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.cache.api_router.reset_encoder_cache", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.cache.api_router.attach_router", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.entrypoints.serve.cache.api_router.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.serve.cache.api_router", "names": [ "vllm.entrypoints.serve.cache.api_router.attach_router", "vllm.entrypoints.serve.cache.api_router.engine_client", "vllm.entrypoints.serve.cache.api_router.logger", "vllm.entrypoints.serve.cache.api_router.reset_encoder_cache", "vllm.entrypoints.serve.cache.api_router.reset_mm_cache", "vllm.entrypoints.serve.cache.api_router.reset_prefix_cache", "vllm.entrypoints.serve.cache.api_router.router" ], "n_typable": 14, "n_typed": 8, "n_any": 0, "n_untyped": 6, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 7, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/serve/disagg/api_router.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.serve.disagg.api_router.router", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.disagg.api_router.generate_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.disagg.api_router.engine_client", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.disagg.api_router.attach_router", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.entrypoints.serve.disagg.api_router.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.disagg.api_router.tokenization", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.disagg.api_router.generate", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.entrypoints.serve.disagg.api_router", "names": [ "vllm.entrypoints.serve.disagg.api_router.attach_router", "vllm.entrypoints.serve.disagg.api_router.engine_client", "vllm.entrypoints.serve.disagg.api_router.generate", "vllm.entrypoints.serve.disagg.api_router.generate_tokens", "vllm.entrypoints.serve.disagg.api_router.logger", "vllm.entrypoints.serve.disagg.api_router.router", "vllm.entrypoints.serve.disagg.api_router.tokenization" ], "n_typable": 13, "n_typed": 9, "n_any": 0, "n_untyped": 4, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 6, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/serve/disagg/protocol.py", "symbol_reports": [ { "kind": "class", "name": "vllm.entrypoints.serve.disagg.protocol.GenerateRequest", "methods": [ { "kind": "function", "name": "GenerateRequest.build_tok_params", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GenerateRequest.request_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateRequest.token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateRequest.features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateRequest.sampling_params", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateRequest.model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateRequest.stream", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateRequest.stream_options", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateRequest.cache_salt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateRequest.priority", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateRequest.kv_transfer_params", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 10, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.serve.disagg.protocol.GenerateResponseChoice", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "GenerateResponseChoice.index", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateResponseChoice.logprobs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateResponseChoice.finish_reason", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateResponseChoice.token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.serve.disagg.protocol.GenerateResponse", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "GenerateResponse.request_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateResponse.choices", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateResponse.prompt_logprobs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateResponse.kv_transfer_params", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.serve.disagg.protocol", "names": [ "vllm.entrypoints.serve.disagg.protocol.GenerateRequest", "vllm.entrypoints.serve.disagg.protocol.GenerateResponse", "vllm.entrypoints.serve.disagg.protocol.GenerateResponseChoice" ], "n_typable": 20, "n_typed": 20, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_classes": 3, "n_attrs": 18, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/serve/disagg/serving.py", "symbol_reports": [ { "kind": "class", "name": "vllm.entrypoints.serve.disagg.serving.ServingTokens", "methods": [ { "kind": "function", "name": "ServingTokens.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "ServingTokens.serve_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ServingTokens.serve_tokens_full_generator", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "ServingTokens._create_tokens_logprobs", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ServingTokens.enable_prompt_tokens_details", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ServingTokens.enable_log_outputs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ServingTokens.force_no_detokenize", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 25, "n_typed": 21, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 18, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.entrypoints.serve.disagg.serving.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.serve.disagg.serving", "names": [ "vllm.entrypoints.serve.disagg.serving.ServingTokens", "vllm.entrypoints.serve.disagg.serving.logger" ], "n_typable": 26, "n_typed": 21, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 18, "n_classes": 1, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/serve/elastic_ep/api_router.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.serve.elastic_ep.api_router.router", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.elastic_ep.api_router.scale_elastic_ep", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.elastic_ep.api_router.engine_client", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.elastic_ep.api_router.is_scaling_elastic_ep", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.elastic_ep.api_router.attach_router", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.entrypoints.serve.elastic_ep.api_router.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.serve.elastic_ep.api_router", "names": [ "vllm.entrypoints.serve.elastic_ep.api_router.attach_router", "vllm.entrypoints.serve.elastic_ep.api_router.engine_client", "vllm.entrypoints.serve.elastic_ep.api_router.is_scaling_elastic_ep", "vllm.entrypoints.serve.elastic_ep.api_router.logger", "vllm.entrypoints.serve.elastic_ep.api_router.router", "vllm.entrypoints.serve.elastic_ep.api_router.scale_elastic_ep" ], "n_typable": 10, "n_typed": 5, "n_any": 0, "n_untyped": 5, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 4, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/serve/elastic_ep/middleware.py", "symbol_reports": [ { "kind": "class", "name": "vllm.entrypoints.serve.elastic_ep.middleware.ScalingMiddleware", "methods": [ { "kind": "function", "name": "ScalingMiddleware.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ScalingMiddleware.__call__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ScalingMiddleware.app", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.entrypoints.serve.elastic_ep.middleware.get_scaling_elastic_ep", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.entrypoints.serve.elastic_ep.middleware.set_scaling_elastic_ep", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.serve.elastic_ep.middleware", "names": [ "vllm.entrypoints.serve.elastic_ep.middleware.ScalingMiddleware", "vllm.entrypoints.serve.elastic_ep.middleware.get_scaling_elastic_ep", "vllm.entrypoints.serve.elastic_ep.middleware.set_scaling_elastic_ep" ], "n_typable": 10, "n_typed": 6, "n_any": 0, "n_untyped": 4, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 1, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/serve/instrumentator/__init__.py", "symbol_reports": [ { "kind": "function", "name": "vllm.entrypoints.serve.instrumentator.register_instrumentator_api_routers", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.serve.instrumentator", "names": [ "vllm.entrypoints.serve.instrumentator.register_instrumentator_api_routers" ], "n_typable": 2, "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/serve/instrumentator/basic.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.serve.instrumentator.basic.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.instrumentator.basic.get_server_load_metrics", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.instrumentator.basic.show_version", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.entrypoints.serve.instrumentator.basic.engine_client", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.entrypoints.serve.instrumentator.basic.router", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.instrumentator.basic.tokenization", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.instrumentator.basic.base", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.serve.instrumentator.basic", "names": [ "vllm.entrypoints.serve.instrumentator.basic.base", "vllm.entrypoints.serve.instrumentator.basic.engine_client", "vllm.entrypoints.serve.instrumentator.basic.get_server_load_metrics", "vllm.entrypoints.serve.instrumentator.basic.logger", "vllm.entrypoints.serve.instrumentator.basic.router", "vllm.entrypoints.serve.instrumentator.basic.show_version", "vllm.entrypoints.serve.instrumentator.basic.tokenization" ], "n_typable": 11, "n_typed": 7, "n_any": 0, "n_untyped": 4, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 4, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/serve/instrumentator/health.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.serve.instrumentator.health.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.entrypoints.serve.instrumentator.health.router", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.instrumentator.health.health", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.instrumentator.health.engine_client", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.serve.instrumentator.health", "names": [ "vllm.entrypoints.serve.instrumentator.health.engine_client", "vllm.entrypoints.serve.instrumentator.health.health", "vllm.entrypoints.serve.instrumentator.health.logger", "vllm.entrypoints.serve.instrumentator.health.router" ], "n_typable": 6, "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 2, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/serve/instrumentator/metrics.py", "symbol_reports": [ { "kind": "function", "name": "vllm.entrypoints.serve.instrumentator.metrics.attach_router", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.entrypoints.serve.instrumentator.metrics.PrometheusResponse", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "PrometheusResponse.media_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.serve.instrumentator.metrics", "names": [ "vllm.entrypoints.serve.instrumentator.metrics.PrometheusResponse", "vllm.entrypoints.serve.instrumentator.metrics.attach_router" ], "n_typable": 2, "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/serve/instrumentator/offline_docs.py", "symbol_reports": [ { "kind": "function", "name": "vllm.entrypoints.serve.instrumentator.offline_docs.attach_router", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.entrypoints.serve.instrumentator.offline_docs.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.serve.instrumentator.offline_docs", "names": [ "vllm.entrypoints.serve.instrumentator.offline_docs.attach_router", "vllm.entrypoints.serve.instrumentator.offline_docs.logger" ], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/serve/instrumentator/server_info.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.serve.instrumentator.server_info.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.instrumentator.server_info.show_server_info", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.entrypoints.serve.instrumentator.server_info.router", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.entrypoints.serve.instrumentator.server_info.PydanticVllmConfig", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.serve.instrumentator.server_info", "names": [ "vllm.entrypoints.serve.instrumentator.server_info.PydanticVllmConfig", "vllm.entrypoints.serve.instrumentator.server_info.logger", "vllm.entrypoints.serve.instrumentator.server_info.router", "vllm.entrypoints.serve.instrumentator.server_info.show_server_info" ], "n_typable": 6, "n_typed": 2, "n_any": 0, "n_untyped": 4, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/serve/lora/api_router.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.serve.lora.api_router.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.entrypoints.serve.lora.api_router.router", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.lora.api_router.attach_router", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.serve.lora.api_router", "names": [ "vllm.entrypoints.serve.lora.api_router.attach_router", "vllm.entrypoints.serve.lora.api_router.logger", "vllm.entrypoints.serve.lora.api_router.router" ], "n_typable": 4, "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/serve/lora/protocol.py", "symbol_reports": [ { "kind": "class", "name": "vllm.entrypoints.serve.lora.protocol.UnloadLoRAAdapterRequest", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "UnloadLoRAAdapterRequest.lora_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "UnloadLoRAAdapterRequest.lora_int_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.serve.lora.protocol.LoadLoRAAdapterRequest", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "LoadLoRAAdapterRequest.lora_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LoadLoRAAdapterRequest.lora_path", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LoadLoRAAdapterRequest.load_inplace", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.serve.lora.protocol", "names": [ "vllm.entrypoints.serve.lora.protocol.LoadLoRAAdapterRequest", "vllm.entrypoints.serve.lora.protocol.UnloadLoRAAdapterRequest" ], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 2, "n_attrs": 5, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/serve/profile/api_router.py", "symbol_reports": [ { "kind": "function", "name": "vllm.entrypoints.serve.profile.api_router.start_profile", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.entrypoints.serve.profile.api_router.router", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.profile.api_router.engine_client", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.profile.api_router.attach_router", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.profile.api_router.stop_profile", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.entrypoints.serve.profile.api_router.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.serve.profile.api_router", "names": [ "vllm.entrypoints.serve.profile.api_router.attach_router", "vllm.entrypoints.serve.profile.api_router.engine_client", "vllm.entrypoints.serve.profile.api_router.logger", "vllm.entrypoints.serve.profile.api_router.router", "vllm.entrypoints.serve.profile.api_router.start_profile", "vllm.entrypoints.serve.profile.api_router.stop_profile" ], "n_typable": 10, "n_typed": 5, "n_any": 0, "n_untyped": 5, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 4, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/serve/rlhf/api_router.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.serve.rlhf.api_router.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.rlhf.api_router.init_weight_transfer_engine", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.rlhf.api_router.update_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.rlhf.api_router.engine_client", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.rlhf.api_router.resume_generation", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.rlhf.api_router.attach_router", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.rlhf.api_router.is_paused", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.rlhf.api_router.get_world_size", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.entrypoints.serve.rlhf.api_router.pause_generation", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "attr", "name": "vllm.entrypoints.serve.rlhf.api_router.router", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.serve.rlhf.api_router", "names": [ "vllm.entrypoints.serve.rlhf.api_router.attach_router", "vllm.entrypoints.serve.rlhf.api_router.engine_client", "vllm.entrypoints.serve.rlhf.api_router.get_world_size", "vllm.entrypoints.serve.rlhf.api_router.init_weight_transfer_engine", "vllm.entrypoints.serve.rlhf.api_router.is_paused", "vllm.entrypoints.serve.rlhf.api_router.logger", "vllm.entrypoints.serve.rlhf.api_router.pause_generation", "vllm.entrypoints.serve.rlhf.api_router.resume_generation", "vllm.entrypoints.serve.rlhf.api_router.router", "vllm.entrypoints.serve.rlhf.api_router.update_weights" ], "n_typable": 22, "n_typed": 16, "n_any": 0, "n_untyped": 6, "n_functions": 8, "n_function_overloads": 8, "n_function_params": 12, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/serve/rpc/api_router.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.serve.rpc.api_router.router", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.rpc.api_router.engine_client", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.rpc.api_router.attach_router", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.entrypoints.serve.rpc.api_router.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.rpc.api_router.collective_rpc", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.serve.rpc.api_router", "names": [ "vllm.entrypoints.serve.rpc.api_router.attach_router", "vllm.entrypoints.serve.rpc.api_router.collective_rpc", "vllm.entrypoints.serve.rpc.api_router.engine_client", "vllm.entrypoints.serve.rpc.api_router.logger", "vllm.entrypoints.serve.rpc.api_router.router" ], "n_typable": 8, "n_typed": 4, "n_any": 0, "n_untyped": 4, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 3, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/serve/sleep/api_router.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.serve.sleep.api_router.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.sleep.api_router.wake_up", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.sleep.api_router.is_sleeping", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.sleep.api_router.attach_router", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.sleep.api_router.engine_client", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.entrypoints.serve.sleep.api_router.router", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.sleep.api_router.sleep", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.serve.sleep.api_router", "names": [ "vllm.entrypoints.serve.sleep.api_router.attach_router", "vllm.entrypoints.serve.sleep.api_router.engine_client", "vllm.entrypoints.serve.sleep.api_router.is_sleeping", "vllm.entrypoints.serve.sleep.api_router.logger", "vllm.entrypoints.serve.sleep.api_router.router", "vllm.entrypoints.serve.sleep.api_router.sleep", "vllm.entrypoints.serve.sleep.api_router.wake_up" ], "n_typable": 12, "n_typed": 6, "n_any": 0, "n_untyped": 6, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 5, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/serve/tokenize/api_router.py", "symbol_reports": [ { "kind": "function", "name": "vllm.entrypoints.serve.tokenize.api_router.tokenize", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.entrypoints.serve.tokenize.api_router.router", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.tokenize.api_router.detokenize", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.entrypoints.serve.tokenize.api_router.attach_router", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.entrypoints.serve.tokenize.api_router.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.serve.tokenize.api_router.tokenization", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.serve.tokenize.api_router", "names": [ "vllm.entrypoints.serve.tokenize.api_router.attach_router", "vllm.entrypoints.serve.tokenize.api_router.detokenize", "vllm.entrypoints.serve.tokenize.api_router.logger", "vllm.entrypoints.serve.tokenize.api_router.router", "vllm.entrypoints.serve.tokenize.api_router.tokenization", "vllm.entrypoints.serve.tokenize.api_router.tokenize" ], "n_typable": 12, "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 6, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/serve/tokenize/protocol.py", "symbol_reports": [ { "kind": "class", "name": "vllm.entrypoints.serve.tokenize.protocol.TokenizeCompletionRequest", "methods": [ { "kind": "function", "name": "TokenizeCompletionRequest.build_tok_params", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TokenizeCompletionRequest.model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TokenizeCompletionRequest.prompt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TokenizeCompletionRequest.add_special_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TokenizeCompletionRequest.return_token_strs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.serve.tokenize.protocol.TokenizeChatRequest", "methods": [ { "kind": "function", "name": "TokenizeChatRequest.check_generation_prompt", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TokenizeChatRequest.build_chat_params", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TokenizeChatRequest.build_tok_params", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TokenizeChatRequest.model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TokenizeChatRequest.messages", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TokenizeChatRequest.add_generation_prompt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TokenizeChatRequest.return_token_strs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TokenizeChatRequest.continue_final_message", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TokenizeChatRequest.add_special_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TokenizeChatRequest.chat_template", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TokenizeChatRequest.chat_template_kwargs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TokenizeChatRequest.mm_processor_kwargs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TokenizeChatRequest.tools", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 17, "n_typed": 15, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_attrs": 10, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.serve.tokenize.protocol.DetokenizeRequest", "methods": [ { "kind": "function", "name": "DetokenizeRequest.build_tok_params", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DetokenizeRequest.model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DetokenizeRequest.tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.serve.tokenize.protocol.TokenizerInfoResponse", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "TokenizerInfoResponse.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TokenizerInfoResponse.tokenizer_class", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.entrypoints.serve.tokenize.protocol.TokenizeRequest", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.entrypoints.serve.tokenize.protocol.DetokenizeResponse", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "DetokenizeResponse.prompt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.serve.tokenize.protocol.TokenizeResponse", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "TokenizeResponse.count", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TokenizeResponse.max_model_len", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TokenizeResponse.tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TokenizeResponse.token_strs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.serve.tokenize.protocol", "names": [ "vllm.entrypoints.serve.tokenize.protocol.DetokenizeRequest", "vllm.entrypoints.serve.tokenize.protocol.DetokenizeResponse", "vllm.entrypoints.serve.tokenize.protocol.TokenizeChatRequest", "vllm.entrypoints.serve.tokenize.protocol.TokenizeCompletionRequest", "vllm.entrypoints.serve.tokenize.protocol.TokenizeRequest", "vllm.entrypoints.serve.tokenize.protocol.TokenizeResponse", "vllm.entrypoints.serve.tokenize.protocol.TokenizerInfoResponse" ], "n_typable": 35, "n_typed": 32, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 6, "n_classes": 6, "n_attrs": 24, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/serve/tokenize/serving.py", "symbol_reports": [ { "kind": "class", "name": "vllm.entrypoints.serve.tokenize.serving.OpenAIServingTokenization", "methods": [ { "kind": "function", "name": "OpenAIServingTokenization.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "OpenAIServingTokenization.create_tokenize", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OpenAIServingTokenization.create_detokenize", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OpenAIServingTokenization.get_tokenizer_info", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OpenAIServingTokenization.chat_template", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingTokenization.chat_template_content_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "OpenAIServingTokenization.trust_request_chat_template", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 16, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 11, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.entrypoints.serve.tokenize.serving.TokenizerInfo", "methods": [ { "kind": "function", "name": "TokenizerInfo.to_dict", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TokenizerInfo._get_tokenizer_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TokenizerInfo._make_json_serializable", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TokenizerInfo.tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TokenizerInfo.chat_template", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 4, "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 1, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.entrypoints.serve.tokenize.serving.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.serve.tokenize.serving", "names": [ "vllm.entrypoints.serve.tokenize.serving.OpenAIServingTokenization", "vllm.entrypoints.serve.tokenize.serving.TokenizerInfo", "vllm.entrypoints.serve.tokenize.serving.logger" ], "n_typable": 23, "n_typed": 18, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 12, "n_classes": 2, "n_attrs": 6, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/ssl.py", "symbol_reports": [ { "kind": "class", "name": "vllm.entrypoints.ssl.SSLCertRefresher", "methods": [ { "kind": "function", "name": "SSLCertRefresher.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "SSLCertRefresher._watch_files", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SSLCertRefresher.stop", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SSLCertRefresher.ssl", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SSLCertRefresher.key_path", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SSLCertRefresher.cert_path", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SSLCertRefresher.ca_path", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SSLCertRefresher.watch_ssl_cert_task", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SSLCertRefresher.watch_ssl_ca_task", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 8, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_attrs": 6, "n_properties": 0 }, { "kind": "attr", "name": "vllm.entrypoints.ssl.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.entrypoints.ssl", "names": [ "vllm.entrypoints.ssl.SSLCertRefresher", "vllm.entrypoints.ssl.logger" ], "n_typable": 16, "n_typed": 8, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_classes": 1, "n_attrs": 7, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/entrypoints/utils.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.entrypoints.utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.entrypoints.utils.create_error_response", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.entrypoints.utils.sanitize_message", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.utils.log_non_default_args", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.entrypoints.utils.ErrorResponse", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.entrypoints.utils.decrement_server_load", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.utils.with_cancellation", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.entrypoints.utils.cli_env_setup", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.entrypoints.utils.process_lora_modules", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.entrypoints.utils.get_max_tokens", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.entrypoints.utils.log_version_and_model", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.entrypoints.utils.VLLM_SUBCMD_PARSER_EPILOG", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.entrypoints.utils.should_include_usage", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.entrypoints.utils.ErrorInfo", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.entrypoints.utils.listen_for_disconnect", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.entrypoints.utils.StreamOptions", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.entrypoints.utils.load_aware_call", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.entrypoints.utils.LoRAModulePath", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.entrypoints.utils", "names": [ "vllm.entrypoints.utils.ErrorInfo", "vllm.entrypoints.utils.ErrorResponse", "vllm.entrypoints.utils.LoRAModulePath", "vllm.entrypoints.utils.StreamOptions", "vllm.entrypoints.utils.VLLM_SUBCMD_PARSER_EPILOG", "vllm.entrypoints.utils.cli_env_setup", "vllm.entrypoints.utils.create_error_response", "vllm.entrypoints.utils.decrement_server_load", "vllm.entrypoints.utils.get_max_tokens", "vllm.entrypoints.utils.listen_for_disconnect", "vllm.entrypoints.utils.load_aware_call", "vllm.entrypoints.utils.log_non_default_args", "vllm.entrypoints.utils.log_version_and_model", "vllm.entrypoints.utils.logger", "vllm.entrypoints.utils.process_lora_modules", "vllm.entrypoints.utils.sanitize_message", "vllm.entrypoints.utils.should_include_usage", "vllm.entrypoints.utils.with_cancellation" ], "n_typable": 36, "n_typed": 28, "n_any": 0, "n_untyped": 8, "n_functions": 12, "n_function_overloads": 12, "n_function_params": 23, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 6, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/env_override.py", "symbol_reports": [ { "kind": "function", "name": "vllm.env_override.should_partition_patched", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.env_override.memory_plan_reuse_patched", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.env_override.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.env_override.get_graph_partition_signature_patched", "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [], "name": "vllm.env_override", "names": [ "vllm.env_override.get_graph_partition_signature_patched", "vllm.env_override.logger", "vllm.env_override.memory_plan_reuse_patched", "vllm.env_override.should_partition_patched" ], "n_typable": 11, "n_typed": 3, "n_any": 0, "n_untyped": 8, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 7, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/envs.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.envs.K_SCALE_CONSTANT", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.envs.get_env_or_set_default", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.envs.VLLM_DISABLE_SHARED_EXPERTS_STREAM", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_USE_FUSED_MOE_GROUPED_TOPK", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_RAY_EXTRA_ENV_VAR_PREFIXES_TO_COPY", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_CPU_OMP_THREADS_BIND", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ROCM_SHUFFLE_KV_CACHE_LAYOUT", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_MODEL_REDIRECT_PATH", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_GPT_OSS_HARMONY_SYSTEM_INSTRUCTIONS", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_OBJECT_STORAGE_SHM_BUFFER_NAME", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ROCM_MOE_PADDING", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.environment_variables", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.MAX_JOBS", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_USE_FLASHINFER_MOE_FP16", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_USE_FLASHINFER_SAMPLER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_KEEP_ALIVE_ON_ENGINE_DEATH", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_DO_NOT_TRACK", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_DEEP_GEMM_WARMUP", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_RAY_BUNDLE_INDICES", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_TPU_BUCKET_PADDING_GAP", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ROCM_USE_SKINNY_GEMM", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.envs.use_aot_compile", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.envs.VLLM_USE_RAY_COMPILED_DAG_CHANNEL_TYPE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_USE_RAY_COMPILED_DAG_OVERLAP_COMM", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_CPU_KVCACHE_SPACE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_MARLIN_USE_ATOMIC_ADD", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_USE_AOT_COMPILE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_DEBUG_DUMP_PATH", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.envs.env_set_with_choices", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "attr", "name": "vllm.envs.VLLM_RANDOMIZE_DP_DUMMY_INPUTS", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_USE_FLASHINFER_MOE_MXFP4_BF16", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.S3_ACCESS_KEY_ID", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_V1_OUTPUT_PROC_CHUNK_SIZE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_NCCL_INCLUDE_PATH", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_MOONCAKE_BOOTSTRAP_PORT", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.CUDA_VISIBLE_DEVICES", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_LOGGING_COLOR", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_COMPILE_CACHE_SAVE_FORMAT", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_USE_TRITON_AWQ", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ROCM_USE_AITER_FP4BMM", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_RAY_DP_PACK_STRATEGY", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_PATTERN_MATCH_DEBUG", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ROCM_CUSTOM_PAGED_ATTN", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.envs.get_default_cache_root", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.envs.VLLM_NVTX_SCOPES_FOR_PROFILING", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_MOE_DP_CHUNK_SIZE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ENABLE_FUSED_MOE_ACTIVATION_CHUNKING", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_LOGGING_PREFIX", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ROCM_USE_AITER_RMSNORM", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.envs.enable_envs_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.envs.VLLM_IMAGE_FETCH_TIMEOUT", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_DEEPEP_HIGH_THROUGHPUT_FORCE_INTRA_NODE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_MORIIO_QP_PER_TRANSFER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_MORIIO_POST_BATCH_SIZE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ROCM_QUICK_REDUCE_CAST_BF16_TO_FP16", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ALLOW_CHUNKED_LOCAL_ATTN_WITH_HYBRID_KV_CACHE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_NIXL_SIDE_CHANNEL_HOST", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ALLREDUCE_USE_FLASHINFER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_AUDIO_FETCH_TIMEOUT", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_USE_FLASHINFER_MOE_INT4", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_WEIGHT_OFFLOADING_DISABLE_UVA", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_GC_DEBUG", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_DEEPEP_LOW_LATENCY_USE_MNNVL", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_DEEPEPLL_NVFP4_DISPATCH", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_USAGE_SOURCE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_MEDIA_LOADING_THREAD_COUNT", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.LD_LIBRARY_PATH", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_MAX_AUDIO_CLIP_FILESIZE_MB", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_MAIN_CUDA_VERSION", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_VIDEO_FETCH_TIMEOUT", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_NIXL_ABORT_REQUEST_TIMEOUT", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_FORCE_AOT_LOAD", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_FLASHINFER_MOE_BACKEND", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_USE_FLASHINFER_MOE_FP4", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.envs.env_list_with_choices", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "attr", "name": "vllm.envs.VLLM_MEDIA_CONNECTOR", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ROCM_USE_AITER_UNIFIED_ATTENTION", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.S3_SECRET_ACCESS_KEY", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_LOGGING_LEVEL", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_DISABLE_PYNCCL", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ROCM_FP8_PADDING", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_TOOL_PARSE_REGEX_TIMEOUT_SECONDS", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ENABLE_MOE_DP_CHUNK", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_RPC_TIMEOUT", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.envs.get_default_config_root", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.envs.compile_factors", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.envs.VLLM_CUSTOM_SCOPES_FOR_PROFILING", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_USE_OINK_OPS", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.LOCAL_RANK", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_MLA_DISABLE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_USE_FLASHINFER_MOE_MXFP4_MXFP8", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_API_KEY", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_USE_MODELSCOPE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ROCM_USE_AITER_MOE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.envs.get_vllm_port", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.envs.VLLM_ROCM_USE_AITER_MHA", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_HOST_IP", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ROCM_QUICK_REDUCE_MAX_SIZE_BYTES_MB", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_LORA_DISABLE_PDL", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ASSETS_CACHE_MODEL_CLEAN", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ROCM_USE_AITER_TRITON_ROPE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_DISABLE_REQUEST_ID_RANDOMIZATION", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_KV_CACHE_LAYOUT", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_SHARED_EXPERTS_STREAM_TOKEN_THRESHOLD", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.envs.env_with_choices", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "attr", "name": "vllm.envs.VLLM_LOGGING_CONFIG_PATH", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_KV_EVENTS_USE_INT_BLOCK_HASHES", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_COMPUTE_NANS_IN_LOGITS", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_CUDART_SO_PATH", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_DEBUG_MFU_METRICS", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_TUNED_CONFIG_FOLDER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_WORKER_MULTIPROC_METHOD", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_RINGBUFFER_WARNING_INTERVAL", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ROCM_QUICK_REDUCE_QUANTIZATION", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_USE_FLASHINFER_MOE_FP8", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_PLUGINS", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_DISABLE_LOG_LOGO", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_MAX_TOKENS_PER_EXPERT_FP4_MOE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ENABLE_CUDA_COMPATIBILITY", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_USE_PRECOMPILED", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.envs.disable_compile_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.envs.VLLM_DBO_COMM_SMS", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_USE_NCCL_SYMM_MEM", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_USE_V2_MODEL_RUNNER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ENABLE_V1_MULTIPROCESSING", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_MM_HASHER_ALGORITHM", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_XLA_USE_SPMD", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_NO_USAGE_STATS", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_USE_NVFP4_CT_EMULATIONS", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_FLASHINFER_WORKSPACE_BUFFER_SIZE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_MARLIN_INPUT_DTYPE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_MORIIO_NUM_WORKERS", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.NO_COLOR", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ENGINE_ITERATION_TIMEOUT_S", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_SERVER_DEV_MODE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ENABLE_RESPONSES_API_STORE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_FLOAT32_MATMUL_PRECISION", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.CMAKE_BUILD_TYPE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ROCM_USE_AITER_FUSION_SHARED_EXPERTS", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.envs.validate_environ", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_TPU_MOST_MODEL_LEN", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_MORIIO_CONNECTOR_READ_MODE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_LOOPBACK_IP", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_VIDEO_LOADER_BACKEND", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_XLA_CACHE_PATH", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VERBOSE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_TRACE_FUNCTION", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_PP_LAYER_PARTITION", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ALLOW_LONG_MAX_MODEL_LEN", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_LOG_BATCHSIZE_INTERVAL", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ROCM_FP8_MFMA_PAGE_ATTN", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_LOGGING_STREAM", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ROCM_USE_AITER_MLA", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_USE_DEEP_GEMM_E8M0", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_TPU_USING_PATHWAYS", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_HAS_FLASHINFER_CUBIN", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_USE_FBGEMM", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ROCM_SLEEP_MEM_CHUNK_SIZE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_GPT_OSS_SYSTEM_TOOL_MCP_LABELS", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_DP_MASTER_IP", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_DEEPEP_BUFFER_SIZE_MB", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ELASTIC_EP_SCALE_UP_LAUNCH", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_USE_FLASHINFER_MOE_MXFP4_MXFP8_CUTLASS", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_MSGPACK_ZERO_COPY_THRESHOLD", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_USE_EXPERIMENTAL_PARSER_CONTEXT", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_SKIP_P2P_CHECK", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.S3_ENDPOINT_URL", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ROCM_USE_AITER_TRITON_GEMM", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_DP_RANK_LOCAL", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_MXFP4_USE_MARLIN", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_MOE_USE_DEEP_GEMM", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_RPC_BASE_PATH", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_RAY_EXTRA_ENV_VARS_TO_COPY", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_NCCL_SO_PATH", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_CPU_NUM_OF_RESERVED_CPU", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_NVFP4_GEMM_BACKEND", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_USE_DEEP_GEMM_TMA_ALIGNED_SCALES", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_USE_MEGA_AOT_ARTIFACT", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_DP_MASTER_PORT", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ROCM_USE_AITER_FP8BMM", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_DEBUG_WORKSPACE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ROCM_USE_AITER_LINEAR", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_TOOL_JSON_ERROR_AUTOMATIC_RETRY", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_DEBUG_LOG_API_SERVER_RESPONSE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.envs.is_set", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_FUSED_MOE_CHUNK_SIZE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_LOG_STATS_INTERVAL", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ENABLE_PREGRAD_PASSES", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.NVCC_THREADS", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_LOG_MODEL_INSPECTION", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ROCM_USE_AITER_PAGED_ATTN", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_USE_BYTECODE_HOOK", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_USAGE_STATS_SERVER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_CONFIGURE_LOGGING", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.envs.disable_envs_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.envs.VLLM_ENABLE_INDUCTOR_MAX_AUTOTUNE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ALLOW_INSECURE_SERIALIZATION", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_HTTP_TIMEOUT_KEEP_ALIVE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_DISABLED_KERNELS", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_USE_STANDALONE_COMPILE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_MQ_MAX_CHUNK_BYTES_MB", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_DISABLE_COMPILE_CACHE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_WEIGHT_OFFLOADING_DISABLE_PIN_MEMORY", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.envs.maybe_convert_int", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_SKIP_PRECOMPILED_VERSION_SUFFIX", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_MOONCAKE_ABORT_REQUEST_TIMEOUT", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.envs.maybe_convert_bool", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ROCM_USE_AITER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_PORT", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ELASTIC_EP_DRAIN_REQUESTS", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_RAY_PER_WORKER_GPUS", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_SLEEP_WHEN_IDLE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_DOCKER_BUILD_CONTEXT", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_LORA_RESOLVER_HF_REPO_LIST", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.Q_SCALE_CONSTANT", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_BLOCKSCALE_FP8_GEMM_FLASHINFER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_LORA_RESOLVER_CACHE_DIR", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_CPU_SGL_KERNEL", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_USE_RAY_WRAPPED_PP_COMM", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ROCM_USE_AITER_FP4_ASM_GEMM", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ENABLE_INDUCTOR_COORDINATE_DESCENT_TUNING", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_TARGET_DEVICE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_FLASHINFER_ALLREDUCE_BACKEND", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_EXECUTE_MODEL_TIMEOUT_SECONDS", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ENABLE_CUDAGRAPH_GC", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_V1_USE_OUTLINES_CACHE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_CUDA_COMPATIBILITY_PATH", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_NIXL_SIDE_CHANNEL_PORT", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_DP_RANK", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_XGRAMMAR_CACHE_MB", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ALLOW_RUNTIME_LORA_UPDATING", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_CACHE_ROOT", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.V_SCALE_CONSTANT", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_DP_SIZE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ASSETS_CACHE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ALLREDUCE_USE_SYMM_MEM", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_ENGINE_READY_TIMEOUT_S", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_SYSTEM_START_DATE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_CONFIG_ROOT", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_XLA_CHECK_RECOMPILATION", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_USE_DEEP_GEMM", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.envs.VLLM_MEDIA_URL_ALLOW_REDIRECTS", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.envs", "names": [ "vllm.envs.CMAKE_BUILD_TYPE", "vllm.envs.CUDA_VISIBLE_DEVICES", "vllm.envs.K_SCALE_CONSTANT", "vllm.envs.LD_LIBRARY_PATH", "vllm.envs.LOCAL_RANK", "vllm.envs.MAX_JOBS", "vllm.envs.NO_COLOR", "vllm.envs.NVCC_THREADS", "vllm.envs.Q_SCALE_CONSTANT", "vllm.envs.S3_ACCESS_KEY_ID", "vllm.envs.S3_ENDPOINT_URL", "vllm.envs.S3_SECRET_ACCESS_KEY", "vllm.envs.VERBOSE", "vllm.envs.VLLM_ALLOW_CHUNKED_LOCAL_ATTN_WITH_HYBRID_KV_CACHE", "vllm.envs.VLLM_ALLOW_INSECURE_SERIALIZATION", "vllm.envs.VLLM_ALLOW_LONG_MAX_MODEL_LEN", "vllm.envs.VLLM_ALLOW_RUNTIME_LORA_UPDATING", "vllm.envs.VLLM_ALLREDUCE_USE_FLASHINFER", "vllm.envs.VLLM_ALLREDUCE_USE_SYMM_MEM", "vllm.envs.VLLM_API_KEY", "vllm.envs.VLLM_ASSETS_CACHE", "vllm.envs.VLLM_ASSETS_CACHE_MODEL_CLEAN", "vllm.envs.VLLM_AUDIO_FETCH_TIMEOUT", "vllm.envs.VLLM_BLOCKSCALE_FP8_GEMM_FLASHINFER", "vllm.envs.VLLM_CACHE_ROOT", "vllm.envs.VLLM_COMPILE_CACHE_SAVE_FORMAT", "vllm.envs.VLLM_COMPUTE_NANS_IN_LOGITS", "vllm.envs.VLLM_CONFIGURE_LOGGING", "vllm.envs.VLLM_CONFIG_ROOT", "vllm.envs.VLLM_CPU_KVCACHE_SPACE", "vllm.envs.VLLM_CPU_NUM_OF_RESERVED_CPU", "vllm.envs.VLLM_CPU_OMP_THREADS_BIND", "vllm.envs.VLLM_CPU_SGL_KERNEL", "vllm.envs.VLLM_CUDART_SO_PATH", "vllm.envs.VLLM_CUDA_COMPATIBILITY_PATH", "vllm.envs.VLLM_CUSTOM_SCOPES_FOR_PROFILING", "vllm.envs.VLLM_DBO_COMM_SMS", "vllm.envs.VLLM_DEBUG_DUMP_PATH", "vllm.envs.VLLM_DEBUG_LOG_API_SERVER_RESPONSE", "vllm.envs.VLLM_DEBUG_MFU_METRICS", "vllm.envs.VLLM_DEBUG_WORKSPACE", "vllm.envs.VLLM_DEEPEPLL_NVFP4_DISPATCH", "vllm.envs.VLLM_DEEPEP_BUFFER_SIZE_MB", "vllm.envs.VLLM_DEEPEP_HIGH_THROUGHPUT_FORCE_INTRA_NODE", "vllm.envs.VLLM_DEEPEP_LOW_LATENCY_USE_MNNVL", "vllm.envs.VLLM_DEEP_GEMM_WARMUP", "vllm.envs.VLLM_DISABLED_KERNELS", "vllm.envs.VLLM_DISABLE_COMPILE_CACHE", "vllm.envs.VLLM_DISABLE_LOG_LOGO", "vllm.envs.VLLM_DISABLE_PYNCCL", "vllm.envs.VLLM_DISABLE_REQUEST_ID_RANDOMIZATION", "vllm.envs.VLLM_DISABLE_SHARED_EXPERTS_STREAM", "vllm.envs.VLLM_DOCKER_BUILD_CONTEXT", "vllm.envs.VLLM_DO_NOT_TRACK", "vllm.envs.VLLM_DP_MASTER_IP", "vllm.envs.VLLM_DP_MASTER_PORT", "vllm.envs.VLLM_DP_RANK", "vllm.envs.VLLM_DP_RANK_LOCAL", "vllm.envs.VLLM_DP_SIZE", "vllm.envs.VLLM_ELASTIC_EP_DRAIN_REQUESTS", "vllm.envs.VLLM_ELASTIC_EP_SCALE_UP_LAUNCH", "vllm.envs.VLLM_ENABLE_CUDAGRAPH_GC", "vllm.envs.VLLM_ENABLE_CUDA_COMPATIBILITY", "vllm.envs.VLLM_ENABLE_FUSED_MOE_ACTIVATION_CHUNKING", "vllm.envs.VLLM_ENABLE_INDUCTOR_COORDINATE_DESCENT_TUNING", "vllm.envs.VLLM_ENABLE_INDUCTOR_MAX_AUTOTUNE", "vllm.envs.VLLM_ENABLE_MOE_DP_CHUNK", "vllm.envs.VLLM_ENABLE_PREGRAD_PASSES", "vllm.envs.VLLM_ENABLE_RESPONSES_API_STORE", "vllm.envs.VLLM_ENABLE_V1_MULTIPROCESSING", "vllm.envs.VLLM_ENGINE_ITERATION_TIMEOUT_S", "vllm.envs.VLLM_ENGINE_READY_TIMEOUT_S", "vllm.envs.VLLM_EXECUTE_MODEL_TIMEOUT_SECONDS", "vllm.envs.VLLM_FLASHINFER_ALLREDUCE_BACKEND", "vllm.envs.VLLM_FLASHINFER_MOE_BACKEND", "vllm.envs.VLLM_FLASHINFER_WORKSPACE_BUFFER_SIZE", "vllm.envs.VLLM_FLOAT32_MATMUL_PRECISION", "vllm.envs.VLLM_FORCE_AOT_LOAD", "vllm.envs.VLLM_FUSED_MOE_CHUNK_SIZE", "vllm.envs.VLLM_GC_DEBUG", "vllm.envs.VLLM_GPT_OSS_HARMONY_SYSTEM_INSTRUCTIONS", "vllm.envs.VLLM_GPT_OSS_SYSTEM_TOOL_MCP_LABELS", "vllm.envs.VLLM_HAS_FLASHINFER_CUBIN", "vllm.envs.VLLM_HOST_IP", "vllm.envs.VLLM_HTTP_TIMEOUT_KEEP_ALIVE", "vllm.envs.VLLM_IMAGE_FETCH_TIMEOUT", "vllm.envs.VLLM_KEEP_ALIVE_ON_ENGINE_DEATH", "vllm.envs.VLLM_KV_CACHE_LAYOUT", "vllm.envs.VLLM_KV_EVENTS_USE_INT_BLOCK_HASHES", "vllm.envs.VLLM_LOGGING_COLOR", "vllm.envs.VLLM_LOGGING_CONFIG_PATH", "vllm.envs.VLLM_LOGGING_LEVEL", "vllm.envs.VLLM_LOGGING_PREFIX", "vllm.envs.VLLM_LOGGING_STREAM", "vllm.envs.VLLM_LOG_BATCHSIZE_INTERVAL", "vllm.envs.VLLM_LOG_MODEL_INSPECTION", "vllm.envs.VLLM_LOG_STATS_INTERVAL", "vllm.envs.VLLM_LOOPBACK_IP", "vllm.envs.VLLM_LORA_DISABLE_PDL", "vllm.envs.VLLM_LORA_RESOLVER_CACHE_DIR", "vllm.envs.VLLM_LORA_RESOLVER_HF_REPO_LIST", "vllm.envs.VLLM_MAIN_CUDA_VERSION", "vllm.envs.VLLM_MARLIN_INPUT_DTYPE", "vllm.envs.VLLM_MARLIN_USE_ATOMIC_ADD", "vllm.envs.VLLM_MAX_AUDIO_CLIP_FILESIZE_MB", "vllm.envs.VLLM_MAX_TOKENS_PER_EXPERT_FP4_MOE", "vllm.envs.VLLM_MEDIA_CONNECTOR", "vllm.envs.VLLM_MEDIA_LOADING_THREAD_COUNT", "vllm.envs.VLLM_MEDIA_URL_ALLOW_REDIRECTS", "vllm.envs.VLLM_MLA_DISABLE", "vllm.envs.VLLM_MM_HASHER_ALGORITHM", "vllm.envs.VLLM_MODEL_REDIRECT_PATH", "vllm.envs.VLLM_MOE_DP_CHUNK_SIZE", "vllm.envs.VLLM_MOE_USE_DEEP_GEMM", "vllm.envs.VLLM_MOONCAKE_ABORT_REQUEST_TIMEOUT", "vllm.envs.VLLM_MOONCAKE_BOOTSTRAP_PORT", "vllm.envs.VLLM_MORIIO_CONNECTOR_READ_MODE", "vllm.envs.VLLM_MORIIO_NUM_WORKERS", "vllm.envs.VLLM_MORIIO_POST_BATCH_SIZE", "vllm.envs.VLLM_MORIIO_QP_PER_TRANSFER", "vllm.envs.VLLM_MQ_MAX_CHUNK_BYTES_MB", "vllm.envs.VLLM_MSGPACK_ZERO_COPY_THRESHOLD", "vllm.envs.VLLM_MXFP4_USE_MARLIN", "vllm.envs.VLLM_NCCL_INCLUDE_PATH", "vllm.envs.VLLM_NCCL_SO_PATH", "vllm.envs.VLLM_NIXL_ABORT_REQUEST_TIMEOUT", "vllm.envs.VLLM_NIXL_SIDE_CHANNEL_HOST", "vllm.envs.VLLM_NIXL_SIDE_CHANNEL_PORT", "vllm.envs.VLLM_NO_USAGE_STATS", "vllm.envs.VLLM_NVFP4_GEMM_BACKEND", "vllm.envs.VLLM_NVTX_SCOPES_FOR_PROFILING", "vllm.envs.VLLM_OBJECT_STORAGE_SHM_BUFFER_NAME", "vllm.envs.VLLM_PATTERN_MATCH_DEBUG", "vllm.envs.VLLM_PLUGINS", "vllm.envs.VLLM_PORT", "vllm.envs.VLLM_PP_LAYER_PARTITION", "vllm.envs.VLLM_RANDOMIZE_DP_DUMMY_INPUTS", "vllm.envs.VLLM_RAY_BUNDLE_INDICES", "vllm.envs.VLLM_RAY_DP_PACK_STRATEGY", "vllm.envs.VLLM_RAY_EXTRA_ENV_VARS_TO_COPY", "vllm.envs.VLLM_RAY_EXTRA_ENV_VAR_PREFIXES_TO_COPY", "vllm.envs.VLLM_RAY_PER_WORKER_GPUS", "vllm.envs.VLLM_RINGBUFFER_WARNING_INTERVAL", "vllm.envs.VLLM_ROCM_CUSTOM_PAGED_ATTN", "vllm.envs.VLLM_ROCM_FP8_MFMA_PAGE_ATTN", "vllm.envs.VLLM_ROCM_FP8_PADDING", "vllm.envs.VLLM_ROCM_MOE_PADDING", "vllm.envs.VLLM_ROCM_QUICK_REDUCE_CAST_BF16_TO_FP16", "vllm.envs.VLLM_ROCM_QUICK_REDUCE_MAX_SIZE_BYTES_MB", "vllm.envs.VLLM_ROCM_QUICK_REDUCE_QUANTIZATION", "vllm.envs.VLLM_ROCM_SHUFFLE_KV_CACHE_LAYOUT", "vllm.envs.VLLM_ROCM_SLEEP_MEM_CHUNK_SIZE", "vllm.envs.VLLM_ROCM_USE_AITER", "vllm.envs.VLLM_ROCM_USE_AITER_FP4BMM", "vllm.envs.VLLM_ROCM_USE_AITER_FP4_ASM_GEMM", "vllm.envs.VLLM_ROCM_USE_AITER_FP8BMM", "vllm.envs.VLLM_ROCM_USE_AITER_FUSION_SHARED_EXPERTS", "vllm.envs.VLLM_ROCM_USE_AITER_LINEAR", "vllm.envs.VLLM_ROCM_USE_AITER_MHA", "vllm.envs.VLLM_ROCM_USE_AITER_MLA", "vllm.envs.VLLM_ROCM_USE_AITER_MOE", "vllm.envs.VLLM_ROCM_USE_AITER_PAGED_ATTN", "vllm.envs.VLLM_ROCM_USE_AITER_RMSNORM", "vllm.envs.VLLM_ROCM_USE_AITER_TRITON_GEMM", "vllm.envs.VLLM_ROCM_USE_AITER_TRITON_ROPE", "vllm.envs.VLLM_ROCM_USE_AITER_UNIFIED_ATTENTION", "vllm.envs.VLLM_ROCM_USE_SKINNY_GEMM", "vllm.envs.VLLM_RPC_BASE_PATH", "vllm.envs.VLLM_RPC_TIMEOUT", "vllm.envs.VLLM_SERVER_DEV_MODE", "vllm.envs.VLLM_SHARED_EXPERTS_STREAM_TOKEN_THRESHOLD", "vllm.envs.VLLM_SKIP_P2P_CHECK", "vllm.envs.VLLM_SKIP_PRECOMPILED_VERSION_SUFFIX", "vllm.envs.VLLM_SLEEP_WHEN_IDLE", "vllm.envs.VLLM_SYSTEM_START_DATE", "vllm.envs.VLLM_TARGET_DEVICE", "vllm.envs.VLLM_TOOL_JSON_ERROR_AUTOMATIC_RETRY", "vllm.envs.VLLM_TOOL_PARSE_REGEX_TIMEOUT_SECONDS", "vllm.envs.VLLM_TPU_BUCKET_PADDING_GAP", "vllm.envs.VLLM_TPU_MOST_MODEL_LEN", "vllm.envs.VLLM_TPU_USING_PATHWAYS", "vllm.envs.VLLM_TRACE_FUNCTION", "vllm.envs.VLLM_TUNED_CONFIG_FOLDER", "vllm.envs.VLLM_USAGE_SOURCE", "vllm.envs.VLLM_USAGE_STATS_SERVER", "vllm.envs.VLLM_USE_AOT_COMPILE", "vllm.envs.VLLM_USE_BYTECODE_HOOK", "vllm.envs.VLLM_USE_DEEP_GEMM", "vllm.envs.VLLM_USE_DEEP_GEMM_E8M0", "vllm.envs.VLLM_USE_DEEP_GEMM_TMA_ALIGNED_SCALES", "vllm.envs.VLLM_USE_EXPERIMENTAL_PARSER_CONTEXT", "vllm.envs.VLLM_USE_FBGEMM", "vllm.envs.VLLM_USE_FLASHINFER_MOE_FP16", "vllm.envs.VLLM_USE_FLASHINFER_MOE_FP4", "vllm.envs.VLLM_USE_FLASHINFER_MOE_FP8", "vllm.envs.VLLM_USE_FLASHINFER_MOE_INT4", "vllm.envs.VLLM_USE_FLASHINFER_MOE_MXFP4_BF16", "vllm.envs.VLLM_USE_FLASHINFER_MOE_MXFP4_MXFP8", "vllm.envs.VLLM_USE_FLASHINFER_MOE_MXFP4_MXFP8_CUTLASS", "vllm.envs.VLLM_USE_FLASHINFER_SAMPLER", "vllm.envs.VLLM_USE_FUSED_MOE_GROUPED_TOPK", "vllm.envs.VLLM_USE_MEGA_AOT_ARTIFACT", "vllm.envs.VLLM_USE_MODELSCOPE", "vllm.envs.VLLM_USE_NCCL_SYMM_MEM", "vllm.envs.VLLM_USE_NVFP4_CT_EMULATIONS", "vllm.envs.VLLM_USE_OINK_OPS", "vllm.envs.VLLM_USE_PRECOMPILED", "vllm.envs.VLLM_USE_RAY_COMPILED_DAG_CHANNEL_TYPE", "vllm.envs.VLLM_USE_RAY_COMPILED_DAG_OVERLAP_COMM", "vllm.envs.VLLM_USE_RAY_WRAPPED_PP_COMM", "vllm.envs.VLLM_USE_STANDALONE_COMPILE", "vllm.envs.VLLM_USE_TRITON_AWQ", "vllm.envs.VLLM_USE_V2_MODEL_RUNNER", "vllm.envs.VLLM_V1_OUTPUT_PROC_CHUNK_SIZE", "vllm.envs.VLLM_V1_USE_OUTLINES_CACHE", "vllm.envs.VLLM_VIDEO_FETCH_TIMEOUT", "vllm.envs.VLLM_VIDEO_LOADER_BACKEND", "vllm.envs.VLLM_WEIGHT_OFFLOADING_DISABLE_PIN_MEMORY", "vllm.envs.VLLM_WEIGHT_OFFLOADING_DISABLE_UVA", "vllm.envs.VLLM_WORKER_MULTIPROC_METHOD", "vllm.envs.VLLM_XGRAMMAR_CACHE_MB", "vllm.envs.VLLM_XLA_CACHE_PATH", "vllm.envs.VLLM_XLA_CHECK_RECOMPILATION", "vllm.envs.VLLM_XLA_USE_SPMD", "vllm.envs.V_SCALE_CONSTANT", "vllm.envs.compile_factors", "vllm.envs.disable_compile_cache", "vllm.envs.disable_envs_cache", "vllm.envs.enable_envs_cache", "vllm.envs.env_list_with_choices", "vllm.envs.env_set_with_choices", "vllm.envs.env_with_choices", "vllm.envs.environment_variables", "vllm.envs.get_default_cache_root", "vllm.envs.get_default_config_root", "vllm.envs.get_env_or_set_default", "vllm.envs.get_vllm_port", "vllm.envs.is_set", "vllm.envs.logger", "vllm.envs.maybe_convert_bool", "vllm.envs.maybe_convert_int", "vllm.envs.use_aot_compile", "vllm.envs.validate_environ" ], "n_typable": 261, "n_typed": 257, "n_any": 0, "n_untyped": 4, "n_functions": 16, "n_function_overloads": 16, "n_function_params": 18, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 227, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/exceptions.py", "symbol_reports": [ { "kind": "class", "name": "vllm.exceptions.VLLMValidationError", "methods": [ { "kind": "function", "name": "VLLMValidationError.__init__", "n_typed": 3, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "VLLMValidationError.__str__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "VLLMValidationError.parameter", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VLLMValidationError.value", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 3, "n_any": 1, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.exceptions", "names": [ "vllm.exceptions.VLLMValidationError" ], "n_typable": 7, "n_typed": 3, "n_any": 1, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_classes": 1, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/forward_context.py", "symbol_reports": [ { "kind": "function", "name": "vllm.forward_context.create_forward_context", "n_typed": 9, "n_any": 1, "n_untyped": 1, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "class", "name": "vllm.forward_context.BatchDescriptor", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "BatchDescriptor.num_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BatchDescriptor.num_reqs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BatchDescriptor.uniform", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BatchDescriptor.has_lora", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BatchDescriptor.num_active_loras", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 5, "n_properties": 0 }, { "kind": "function", "name": "vllm.forward_context.override_forward_context", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.forward_context.set_forward_context", "n_typed": 9, "n_any": 1, "n_untyped": 1, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "attr", "name": "vllm.forward_context.forward_start_time", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.forward_context.DPMetadata", "methods": [ { "kind": "function", "name": "DPMetadata.make", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DPMetadata.chunked_sizes", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DPMetadata.sp_local_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DPMetadata.get_chunk_sizes_across_dp_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DPMetadata.cu_tokens_across_sp", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DPMetadata.max_tokens_across_dp_cpu", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DPMetadata.num_tokens_across_dp_cpu", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DPMetadata.local_sizes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 13, "n_typed": 11, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 8, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.forward_context.batchsize_forward_time", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.forward_context.is_forward_context_available", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "class", "name": "vllm.forward_context.ForwardContext", "methods": [ { "kind": "function", "name": "ForwardContext.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ForwardContext.no_compile_layers", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ForwardContext.attn_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ForwardContext.slot_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ForwardContext.virtual_engine", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ForwardContext.dp_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ForwardContext.cudagraph_runtime_mode", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ForwardContext.batch_descriptor", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ForwardContext.ubatch_slices", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ForwardContext.skip_compiled", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ForwardContext.all_moe_layers", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ForwardContext.moe_layer_index", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ForwardContext.additional_kwargs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 12, "n_properties": 0 }, { "kind": "attr", "name": "vllm.forward_context.track_batchsize", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.forward_context.last_logging_time", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.forward_context.get_forward_context", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.forward_context.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.forward_context.batchsize_logging_interval", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.forward_context", "names": [ "vllm.forward_context.BatchDescriptor", "vllm.forward_context.DPMetadata", "vllm.forward_context.ForwardContext", "vllm.forward_context.batchsize_forward_time", "vllm.forward_context.batchsize_logging_interval", "vllm.forward_context.create_forward_context", "vllm.forward_context.forward_start_time", "vllm.forward_context.get_forward_context", "vllm.forward_context.is_forward_context_available", "vllm.forward_context.last_logging_time", "vllm.forward_context.logger", "vllm.forward_context.override_forward_context", "vllm.forward_context.set_forward_context", "vllm.forward_context.track_batchsize" ], "n_typable": 46, "n_typed": 37, "n_any": 2, "n_untyped": 7, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 21, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 8, "n_classes": 3, "n_attrs": 26, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/grpc/compile_protos.py", "symbol_reports": [ { "kind": "function", "name": "vllm.grpc.compile_protos.compile_protos", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "type_ignores": [], "name": "vllm.grpc.compile_protos", "names": [ "vllm.grpc.compile_protos.compile_protos" ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/grpc/vllm_engine_pb2.pyi", "symbol_reports": [ { "kind": "class", "name": "vllm.grpc.vllm_engine_pb2.AbortResponse", "methods": [ { "kind": "function", "name": "AbortResponse.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.grpc.vllm_engine_pb2.GetServerInfoResponse", "methods": [ { "kind": "function", "name": "GetServerInfoResponse.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GetServerInfoResponse.ACTIVE_REQUESTS_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GetServerInfoResponse.IS_PAUSED_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GetServerInfoResponse.LAST_RECEIVE_TIMESTAMP_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GetServerInfoResponse.UPTIME_SECONDS_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GetServerInfoResponse.SERVER_TYPE_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GetServerInfoResponse.active_requests", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GetServerInfoResponse.is_paused", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GetServerInfoResponse.last_receive_timestamp", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GetServerInfoResponse.uptime_seconds", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GetServerInfoResponse.server_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 16, "n_typed": 16, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 5, "n_attrs": 10, "n_properties": 0 }, { "kind": "class", "name": "vllm.grpc.vllm_engine_pb2.GenerateRequest", "methods": [ { "kind": "function", "name": "GenerateRequest.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GenerateRequest.REQUEST_ID_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateRequest.TOKENIZED_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateRequest.TEXT_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateRequest.SAMPLING_PARAMS_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateRequest.STREAM_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateRequest.request_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateRequest.tokenized", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateRequest.text", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateRequest.sampling_params", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateRequest.stream", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 16, "n_typed": 16, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 5, "n_attrs": 10, "n_properties": 0 }, { "kind": "class", "name": "vllm.grpc.vllm_engine_pb2.GenerateStreamChunk", "methods": [ { "kind": "function", "name": "GenerateStreamChunk.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GenerateStreamChunk.TOKEN_IDS_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateStreamChunk.PROMPT_TOKENS_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateStreamChunk.COMPLETION_TOKENS_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateStreamChunk.CACHED_TOKENS_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateStreamChunk.token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateStreamChunk.prompt_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateStreamChunk.completion_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateStreamChunk.cached_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 13, "n_typed": 13, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 4, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.grpc.vllm_engine_pb2.HealthCheckResponse", "methods": [ { "kind": "function", "name": "HealthCheckResponse.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "HealthCheckResponse.HEALTHY_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "HealthCheckResponse.MESSAGE_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "HealthCheckResponse.healthy", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "HealthCheckResponse.message", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.grpc.vllm_engine_pb2.TokenizedInput", "methods": [ { "kind": "function", "name": "TokenizedInput.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TokenizedInput.ORIGINAL_TEXT_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TokenizedInput.INPUT_IDS_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TokenizedInput.original_text", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TokenizedInput.input_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.grpc.vllm_engine_pb2.GetServerInfoRequest", "methods": [ { "kind": "function", "name": "GetServerInfoRequest.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.grpc.vllm_engine_pb2.DESCRIPTOR", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.grpc.vllm_engine_pb2.SamplingParams", "methods": [ { "kind": "function", "name": "SamplingParams.__init__", "n_typed": 28, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 28, "n_params": 27, "n_function_overloads": 1, "n_function_params": 27 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SamplingParams.TEMPERATURE_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.TOP_P_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.TOP_K_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.MIN_P_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.FREQUENCY_PENALTY_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.PRESENCE_PENALTY_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.REPETITION_PENALTY_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.MAX_TOKENS_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.MIN_TOKENS_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.STOP_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.STOP_TOKEN_IDS_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.SKIP_SPECIAL_TOKENS_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.SPACES_BETWEEN_SPECIAL_TOKENS_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.IGNORE_EOS_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.N_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.LOGPROBS_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.PROMPT_LOGPROBS_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.SEED_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.INCLUDE_STOP_STR_IN_OUTPUT_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.LOGIT_BIAS_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.TRUNCATE_PROMPT_TOKENS_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.JSON_SCHEMA_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.REGEX_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.GRAMMAR_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.STRUCTURAL_TAG_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.JSON_OBJECT_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.CHOICE_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.temperature", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.top_p", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.top_k", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.min_p", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.frequency_penalty", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.presence_penalty", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.repetition_penalty", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.max_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.min_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.stop", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.stop_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.skip_special_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.spaces_between_special_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.ignore_eos", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.n", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.logprobs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.prompt_logprobs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.seed", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.include_stop_str_in_output", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.logit_bias", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.truncate_prompt_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.json_schema", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.regex", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.grammar", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.structural_tag", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.json_object", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SamplingParams.choice", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 82, "n_typed": 82, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 27, "n_attrs": 54, "n_properties": 0 }, { "kind": "class", "name": "vllm.grpc.vllm_engine_pb2.HealthCheckRequest", "methods": [ { "kind": "function", "name": "HealthCheckRequest.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.grpc.vllm_engine_pb2.EmbedResponse", "methods": [ { "kind": "function", "name": "EmbedResponse.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EmbedResponse.EMBEDDING_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EmbedResponse.PROMPT_TOKENS_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EmbedResponse.EMBEDDING_DIM_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EmbedResponse.embedding", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EmbedResponse.prompt_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EmbedResponse.embedding_dim", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 10, "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 3, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.grpc.vllm_engine_pb2.GetModelInfoResponse", "methods": [ { "kind": "function", "name": "GetModelInfoResponse.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GetModelInfoResponse.MODEL_PATH_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GetModelInfoResponse.IS_GENERATION_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GetModelInfoResponse.MAX_CONTEXT_LENGTH_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GetModelInfoResponse.VOCAB_SIZE_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GetModelInfoResponse.SUPPORTS_VISION_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GetModelInfoResponse.model_path", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GetModelInfoResponse.is_generation", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GetModelInfoResponse.max_context_length", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GetModelInfoResponse.vocab_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GetModelInfoResponse.supports_vision", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 16, "n_typed": 16, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 5, "n_attrs": 10, "n_properties": 0 }, { "kind": "class", "name": "vllm.grpc.vllm_engine_pb2.GenerateComplete", "methods": [ { "kind": "function", "name": "GenerateComplete.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GenerateComplete.OUTPUT_IDS_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateComplete.FINISH_REASON_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateComplete.PROMPT_TOKENS_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateComplete.COMPLETION_TOKENS_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateComplete.CACHED_TOKENS_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateComplete.output_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateComplete.finish_reason", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateComplete.prompt_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateComplete.completion_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateComplete.cached_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 16, "n_typed": 16, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 5, "n_attrs": 10, "n_properties": 0 }, { "kind": "class", "name": "vllm.grpc.vllm_engine_pb2.GetModelInfoRequest", "methods": [ { "kind": "function", "name": "GetModelInfoRequest.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.grpc.vllm_engine_pb2.ChoiceConstraint", "methods": [ { "kind": "function", "name": "ChoiceConstraint.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ChoiceConstraint.CHOICES_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChoiceConstraint.choices", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.grpc.vllm_engine_pb2.LogitBiasEntry", "methods": [ { "kind": "function", "name": "LogitBiasEntry.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LogitBiasEntry.KEY_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LogitBiasEntry.VALUE_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LogitBiasEntry.key", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LogitBiasEntry.value", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.grpc.vllm_engine_pb2.AbortRequest", "methods": [ { "kind": "function", "name": "AbortRequest.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AbortRequest.REQUEST_IDS_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AbortRequest.request_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.grpc.vllm_engine_pb2.EmbedRequest", "methods": [ { "kind": "function", "name": "EmbedRequest.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EmbedRequest.REQUEST_ID_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EmbedRequest.TOKENIZED_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EmbedRequest.request_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EmbedRequest.tokenized", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.grpc.vllm_engine_pb2.GenerateResponse", "methods": [ { "kind": "function", "name": "GenerateResponse.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GenerateResponse.CHUNK_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateResponse.COMPLETE_FIELD_NUMBER", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateResponse.chunk", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GenerateResponse.complete", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 4, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.grpc.vllm_engine_pb2", "names": [ "vllm.grpc.vllm_engine_pb2.AbortRequest", "vllm.grpc.vllm_engine_pb2.AbortResponse", "vllm.grpc.vllm_engine_pb2.ChoiceConstraint", "vllm.grpc.vllm_engine_pb2.DESCRIPTOR", "vllm.grpc.vllm_engine_pb2.EmbedRequest", "vllm.grpc.vllm_engine_pb2.EmbedResponse", "vllm.grpc.vllm_engine_pb2.GenerateComplete", "vllm.grpc.vllm_engine_pb2.GenerateRequest", "vllm.grpc.vllm_engine_pb2.GenerateResponse", "vllm.grpc.vllm_engine_pb2.GenerateStreamChunk", "vllm.grpc.vllm_engine_pb2.GetModelInfoRequest", "vllm.grpc.vllm_engine_pb2.GetModelInfoResponse", "vllm.grpc.vllm_engine_pb2.GetServerInfoRequest", "vllm.grpc.vllm_engine_pb2.GetServerInfoResponse", "vllm.grpc.vllm_engine_pb2.HealthCheckRequest", "vllm.grpc.vllm_engine_pb2.HealthCheckResponse", "vllm.grpc.vllm_engine_pb2.LogitBiasEntry", "vllm.grpc.vllm_engine_pb2.SamplingParams", "vllm.grpc.vllm_engine_pb2.TokenizedInput" ], "n_typable": 217, "n_typed": 217, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 18, "n_method_overloads": 18, "n_method_params": 66, "n_classes": 18, "n_attrs": 133, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/grpc/vllm_engine_pb2_grpc.py", "symbol_reports": [ { "kind": "class", "name": "vllm.grpc.vllm_engine_pb2_grpc.VllmEngineServicer", "methods": [ { "kind": "function", "name": "VllmEngineServicer.Generate", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VllmEngineServicer.Embed", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VllmEngineServicer.HealthCheck", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VllmEngineServicer.Abort", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VllmEngineServicer.GetModelInfo", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VllmEngineServicer.GetServerInfo", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 18, "n_typed": 0, "n_any": 0, "n_untyped": 18, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 12, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.grpc.vllm_engine_pb2_grpc.VllmEngineStub", "methods": [ { "kind": "function", "name": "VllmEngineStub.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "VllmEngineStub.Generate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VllmEngineStub.Embed", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VllmEngineStub.HealthCheck", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VllmEngineStub.Abort", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VllmEngineStub.GetModelInfo", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VllmEngineStub.GetServerInfo", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 0, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.grpc.vllm_engine_pb2_grpc.VllmEngine", "methods": [ { "kind": "function", "name": "VllmEngine.Generate", "n_typed": 0, "n_any": 0, "n_untyped": 11, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "VllmEngine.Embed", "n_typed": 0, "n_any": 0, "n_untyped": 11, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "VllmEngine.HealthCheck", "n_typed": 0, "n_any": 0, "n_untyped": 11, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "VllmEngine.Abort", "n_typed": 0, "n_any": 0, "n_untyped": 11, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "VllmEngine.GetModelInfo", "n_typed": 0, "n_any": 0, "n_untyped": 11, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "VllmEngine.GetServerInfo", "n_typed": 0, "n_any": 0, "n_untyped": 11, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 } ], "properties": [], "attrs": [], "n_typable": 66, "n_typed": 0, "n_any": 0, "n_untyped": 66, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 60, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.grpc.vllm_engine_pb2_grpc.add_VllmEngineServicer_to_server", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.grpc.vllm_engine_pb2_grpc.GRPC_GENERATED_VERSION", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.grpc.vllm_engine_pb2_grpc", "names": [ "vllm.grpc.vllm_engine_pb2_grpc.GRPC_GENERATED_VERSION", "vllm.grpc.vllm_engine_pb2_grpc.VllmEngine", "vllm.grpc.vllm_engine_pb2_grpc.VllmEngineServicer", "vllm.grpc.vllm_engine_pb2_grpc.VllmEngineStub", "vllm.grpc.vllm_engine_pb2_grpc.add_VllmEngineServicer_to_server" ], "n_typable": 95, "n_typed": 0, "n_any": 0, "n_untyped": 95, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 73, "n_classes": 3, "n_attrs": 7, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/inputs/parse.py", "symbol_reports": [ { "kind": "function", "name": "vllm.inputs.parse.split_enc_dec_inputs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.inputs.parse", "names": [ "vllm.inputs.parse.split_enc_dec_inputs" ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/inputs/preprocess.py", "symbol_reports": [ { "kind": "class", "name": "vllm.inputs.preprocess.InputPreprocessor", "methods": [ { "kind": "function", "name": "InputPreprocessor.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "InputPreprocessor.get_tokenizer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "InputPreprocessor._tokenize_prompt", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InputPreprocessor._process_multimodal", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "InputPreprocessor._process_embeds", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InputPreprocessor._truncate_inputs", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InputPreprocessor._process_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InputPreprocessor._process_text", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InputPreprocessor._prompt_to_llm_inputs", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 3, "n_typable": 3, "n_params": 2, "n_function_overloads": 3, "n_function_params": 2 }, { "kind": "function", "name": "InputPreprocessor._process_encoder_decoder_prompt", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InputPreprocessor._process_decoder_only_prompt", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InputPreprocessor.preprocess", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [ { "kind": "property", "name": "InputPreprocessor.tokenizer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "InputPreprocessor.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputPreprocessor.renderer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputPreprocessor.mm_registry", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 41, "n_typed": 38, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 14, "n_method_params": 25, "n_attrs": 3, "n_properties": 1 }, { "kind": "attr", "name": "vllm.inputs.preprocess.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.inputs.preprocess", "names": [ "vllm.inputs.preprocess.InputPreprocessor", "vllm.inputs.preprocess.logger" ], "n_typable": 42, "n_typed": 38, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 14, "n_method_params": 25, "n_classes": 1, "n_attrs": 4, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/kernels/helion/utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.kernels.helion.utils.canonicalize_gpu_name", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.kernels.helion.utils.get_canonical_gpu_name", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.kernels.helion.utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.kernels.helion.utils.get_gpu_name", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.kernels.helion.utils", "names": [ "vllm.kernels.helion.utils.canonicalize_gpu_name", "vllm.kernels.helion.utils.get_canonical_gpu_name", "vllm.kernels.helion.utils.get_gpu_name", "vllm.kernels.helion.utils.logger" ], "n_typable": 7, "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 3, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/kernels/helion/register.py", "symbol_reports": [ { "kind": "function", "name": "vllm.kernels.helion.register.get_kernel_by_name", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.kernels.helion.register.vllm_helion_lib", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.kernels.helion.register.get_registered_kernels", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.kernels.helion.register.register_kernel", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 4, "n_params": 3, "n_function_overloads": 2, "n_function_params": 3 }, { "kind": "class", "name": "vllm.kernels.helion.register.ConfiguredHelionKernel", "methods": [ { "kind": "function", "name": "ConfiguredHelionKernel.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ConfiguredHelionKernel.__call__", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ConfiguredHelionKernel._create_key_computer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ConfiguredHelionKernel._create_config_selector", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ConfiguredHelionKernel._load_platform_configs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ConfiguredHelionKernel._create_decorated_kernel", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ConfiguredHelionKernel.op_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConfiguredHelionKernel.config_picker", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConfiguredHelionKernel.raw_kernel_func", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConfiguredHelionKernel.helion_settings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 6, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 7, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.kernels.helion.register.HelionKernelWrapper", "methods": [ { "kind": "function", "name": "HelionKernelWrapper.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "HelionKernelWrapper.__call__", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "HelionKernelWrapper._call_via_hop", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "HelionKernelWrapper._partition_args", "n_typed": 3, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "HelionKernelWrapper.register_config_picker", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HelionKernelWrapper.register_input_generator", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HelionKernelWrapper.get_inputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "HelionKernelWrapper.run_autotune", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "HelionKernelWrapper.get_configured_op", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "HelionKernelWrapper._get_or_register_custom_op", "n_typed": 0, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "HelionKernelWrapper.raw_kernel_func", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HelionKernelWrapper.op_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HelionKernelWrapper.helion_settings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 28, "n_typed": 18, "n_any": 3, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 15, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.kernels.helion.register.PresetConfigSearch", "methods": [ { "kind": "function", "name": "PresetConfigSearch.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PresetConfigSearch.autotune", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PresetConfigSearch.args", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PresetConfigSearch.config_selector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 4, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 2, "n_properties": 0 }, { "kind": "function", "name": "vllm.kernels.helion.register.create_helion_decorated_kernel", "n_typed": 3, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.kernels.helion.register.infer_fake_impl", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.kernels.helion.register.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.kernels.helion.register.validate_helion_settings", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.kernels.helion.register", "names": [ "vllm.kernels.helion.register.ConfiguredHelionKernel", "vllm.kernels.helion.register.HelionKernelWrapper", "vllm.kernels.helion.register.PresetConfigSearch", "vllm.kernels.helion.register.create_helion_decorated_kernel", "vllm.kernels.helion.register.get_kernel_by_name", "vllm.kernels.helion.register.get_registered_kernels", "vllm.kernels.helion.register.infer_fake_impl", "vllm.kernels.helion.register.logger", "vllm.kernels.helion.register.register_kernel", "vllm.kernels.helion.register.validate_helion_settings", "vllm.kernels.helion.register.vllm_helion_lib" ], "n_typable": 71, "n_typed": 44, "n_any": 4, "n_untyped": 23, "n_functions": 6, "n_function_overloads": 7, "n_function_params": 11, "n_methods": 18, "n_method_overloads": 18, "n_method_params": 25, "n_classes": 3, "n_attrs": 11, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/kernels/helion/config_manager.py", "symbol_reports": [ { "kind": "class", "name": "vllm.kernels.helion.config_manager.ConfigSet", "methods": [ { "kind": "function", "name": "ConfigSet.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ConfigSet.get_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ConfigSet.get_platforms", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ConfigSet.get_config_keys", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ConfigSet.to_dict", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ConfigSet.from_dict", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ConfigSet.set_config", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ConfigSet.has_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [ { "kind": "property", "name": "ConfigSet.kernel_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "ConfigSet._ConfigDict", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 20, "n_typed": 19, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 11, "n_attrs": 1, "n_properties": 1 }, { "kind": "class", "name": "vllm.kernels.helion.config_manager.ConfigManager", "methods": [ { "kind": "function", "name": "ConfigManager.__new__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ConfigManager.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ConfigManager._resolve_base_dir", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ConfigManager.get_instance", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ConfigManager.reset_instance", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ConfigManager.get_config_file_path", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ConfigManager.ensure_base_dir_exists", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ConfigManager.ensure_base_dir_writable", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ConfigManager.load_config_set", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ConfigManager.get_platform_configs", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ConfigManager.save_config_set", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ConfigManager.save_configs", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ConfigManager.config_exists", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ConfigManager._instance", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ConfigManager._instance_base_dir", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 29, "n_typed": 28, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 14, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.kernels.helion.config_manager.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.kernels.helion.config_manager", "names": [ "vllm.kernels.helion.config_manager.ConfigManager", "vllm.kernels.helion.config_manager.ConfigSet", "vllm.kernels.helion.config_manager.logger" ], "n_typable": 50, "n_typed": 47, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 21, "n_method_overloads": 21, "n_method_params": 25, "n_classes": 2, "n_attrs": 4, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/kernels/helion/ops/silu_mul_fp8.py", "symbol_reports": [ { "kind": "function", "name": "vllm.kernels.helion.ops.silu_mul_fp8.generate_silu_mul_fp8_inputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.kernels.helion.ops.silu_mul_fp8.silu_mul_fp8_baseline", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.kernels.helion.ops.silu_mul_fp8.silu_mul_fp8", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.kernels.helion.ops.silu_mul_fp8.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.kernels.helion.ops.silu_mul_fp8.pick_silu_mul_fp8_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [ { "kind": "type", "rules": [ "misc" ] }, { "kind": "type", "rules": [ "misc" ] }, { "kind": "type", "rules": [ "misc" ] } ], "name": "vllm.kernels.helion.ops.silu_mul_fp8", "names": [ "vllm.kernels.helion.ops.silu_mul_fp8.generate_silu_mul_fp8_inputs", "vllm.kernels.helion.ops.silu_mul_fp8.logger", "vllm.kernels.helion.ops.silu_mul_fp8.pick_silu_mul_fp8_config", "vllm.kernels.helion.ops.silu_mul_fp8.silu_mul_fp8", "vllm.kernels.helion.ops.silu_mul_fp8.silu_mul_fp8_baseline" ], "n_typable": 11, "n_typed": 10, "n_any": 0, "n_untyped": 1, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 6, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 3 }, { "path": "vllm/logger.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.logger.DEFAULT_LOGGING_CONFIG", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.logger.init_logger", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.logger.current_formatter_type", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.logger.LogScope", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.logger.suppress_logging", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.logger.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.logger.enable_trace_function_call", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.logger", "names": [ "vllm.logger.DEFAULT_LOGGING_CONFIG", "vllm.logger.LogScope", "vllm.logger.current_formatter_type", "vllm.logger.enable_trace_function_call", "vllm.logger.init_logger", "vllm.logger.logger", "vllm.logger.suppress_logging" ], "n_typable": 12, "n_typed": 10, "n_any": 0, "n_untyped": 2, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 5, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/logging_utils/lazy.py", "symbol_reports": [ { "kind": "class", "name": "vllm.logging_utils.lazy.lazy", "methods": [ { "kind": "function", "name": "lazy.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "lazy.__str__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "lazy.__repr__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.logging_utils.lazy", "names": [ "vllm.logging_utils.lazy.lazy" ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 1, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/logging_utils/formatter.py", "symbol_reports": [ { "kind": "class", "name": "vllm.logging_utils.formatter.ColoredFormatter", "methods": [ { "kind": "function", "name": "ColoredFormatter.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ColoredFormatter.format", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ColoredFormatter.COLORS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ColoredFormatter.GREY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ColoredFormatter.RESET", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 6, "n_typed": 0, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.logging_utils.formatter.NewLineFormatter", "methods": [ { "kind": "function", "name": "NewLineFormatter.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "NewLineFormatter.format", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "NewLineFormatter.use_relpath", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NewLineFormatter.root_dir", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 0, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.logging_utils.formatter", "names": [ "vllm.logging_utils.formatter.ColoredFormatter", "vllm.logging_utils.formatter.NewLineFormatter" ], "n_typable": 14, "n_typed": 0, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_classes": 2, "n_attrs": 5, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/logging_utils/access_log_filter.py", "symbol_reports": [ { "kind": "function", "name": "vllm.logging_utils.access_log_filter.create_uvicorn_log_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.logging_utils.access_log_filter.UvicornAccessLogFilter", "methods": [ { "kind": "function", "name": "UvicornAccessLogFilter.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "UvicornAccessLogFilter.filter", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "UvicornAccessLogFilter.excluded_paths", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 5, "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.logging_utils.access_log_filter", "names": [ "vllm.logging_utils.access_log_filter.UvicornAccessLogFilter", "vllm.logging_utils.access_log_filter.create_uvicorn_log_config" ], "n_typable": 8, "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/logging_utils/log_time.py", "symbol_reports": [ { "kind": "function", "name": "vllm.logging_utils.log_time.logtime", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.logging_utils.log_time", "names": [ "vllm.logging_utils.log_time.logtime" ], "n_typable": 3, "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/logging_utils/dump_input.py", "symbol_reports": [ { "kind": "function", "name": "vllm.logging_utils.dump_input.dump_engine_exception", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.logging_utils.dump_input.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.logging_utils.dump_input.prepare_object_to_dump", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.logging_utils.dump_input", "names": [ "vllm.logging_utils.dump_input.dump_engine_exception", "vllm.logging_utils.dump_input.logger", "vllm.logging_utils.dump_input.prepare_object_to_dump" ], "n_typable": 7, "n_typed": 4, "n_any": 0, "n_untyped": 3, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 4, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/logits_process.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.logits_process.LogitsProcessor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.logits_process.get_bad_words_logits_processors", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.logits_process.NoBadWordsLogitsProcessor", "methods": [ { "kind": "function", "name": "NoBadWordsLogitsProcessor.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NoBadWordsLogitsProcessor.__call__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NoBadWordsLogitsProcessor._init_word_bias", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NoBadWordsLogitsProcessor._check_token_ids_bounds", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "NoBadWordsLogitsProcessor._SMALLEST_LOGIT", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NoBadWordsLogitsProcessor._NEUTRAL_LOGIT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NoBadWordsLogitsProcessor.bad_words_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NoBadWordsLogitsProcessor.word_bias", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 12, "n_typed": 9, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 5, "n_attrs": 4, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.logits_process", "names": [ "vllm.logits_process.LogitsProcessor", "vllm.logits_process.NoBadWordsLogitsProcessor", "vllm.logits_process.get_bad_words_logits_processors" ], "n_typable": 16, "n_typed": 13, "n_any": 0, "n_untyped": 3, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 5, "n_classes": 1, "n_attrs": 5, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/logprobs.py", "symbol_reports": [ { "kind": "function", "name": "vllm.logprobs.create_sample_logprobs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.logprobs.FlatLogprobs", "methods": [ { "kind": "function", "name": "FlatLogprobs.append", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlatLogprobs.append_fast", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FlatLogprobs.extend", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlatLogprobs.__len__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlatLogprobs.__getitem__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 3, "n_params": 2, "n_function_overloads": 2, "n_function_params": 2 }, { "kind": "function", "name": "FlatLogprobs.__setitem__", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FlatLogprobs.__delitem__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlatLogprobs.insert", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FlatLogprobs.__iter__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlatLogprobs.start_indices", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlatLogprobs.end_indices", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlatLogprobs.token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlatLogprobs.logprobs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlatLogprobs.ranks", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlatLogprobs.decoded_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 22, "n_typed": 18, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 10, "n_method_params": 13, "n_attrs": 6, "n_properties": 0 }, { "kind": "attr", "name": "vllm.logprobs.LogprobsOnePosition", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.logprobs.append_logprobs_for_next_position", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "attr", "name": "vllm.logprobs.SampleLogprobs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.logprobs.create_prompt_logprobs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.logprobs.PromptLogprobs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.logprobs.Logprob", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Logprob.logprob", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Logprob.rank", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Logprob.decoded_token", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.logprobs", "names": [ "vllm.logprobs.FlatLogprobs", "vllm.logprobs.Logprob", "vllm.logprobs.LogprobsOnePosition", "vllm.logprobs.PromptLogprobs", "vllm.logprobs.SampleLogprobs", "vllm.logprobs.append_logprobs_for_next_position", "vllm.logprobs.create_prompt_logprobs", "vllm.logprobs.create_sample_logprobs" ], "n_typable": 33, "n_typed": 29, "n_any": 0, "n_untyped": 4, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 8, "n_methods": 9, "n_method_overloads": 10, "n_method_params": 13, "n_classes": 2, "n_attrs": 12, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/lora/layers/utils.py", "symbol_reports": [ { "kind": "class", "name": "vllm.lora.layers.utils.LoRAMappingType", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "LoRAMappingType.LANGUAGE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LoRAMappingType.TOWER", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LoRAMappingType.CONNECTOR", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.lora.layers.utils.LoRAMapping", "methods": [ { "kind": "function", "name": "LoRAMapping.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LoRAMapping.index_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LoRAMapping.prompt_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LoRAMapping.is_prefill", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LoRAMapping.type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "function", "name": "vllm.lora.layers.utils.try_get_optimal_moe_lora_config", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 } ], "type_ignores": [], "name": "vllm.lora.layers.utils", "names": [ "vllm.lora.layers.utils.LoRAMapping", "vllm.lora.layers.utils.LoRAMappingType", "vllm.lora.layers.utils.try_get_optimal_moe_lora_config" ], "n_typable": 10, "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 8, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_classes": 2, "n_attrs": 7, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/lora/layers/column_parallel_linear.py", "symbol_reports": [ { "kind": "class", "name": "vllm.lora.layers.column_parallel_linear.QKVParallelLinearWithLoRA", "methods": [ { "kind": "function", "name": "QKVParallelLinearWithLoRA.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "QKVParallelLinearWithLoRA.slice_lora_b", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "QKVParallelLinearWithLoRA.can_replace_layer", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "QKVParallelLinearWithLoRA.q_proj_total_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QKVParallelLinearWithLoRA.q_proj_shard_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QKVParallelLinearWithLoRA.kv_proj_shard_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QKVParallelLinearWithLoRA.kv_proj_total_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QKVParallelLinearWithLoRA.n_slices", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 9, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.lora.layers.column_parallel_linear.MergedQKVParallelLinearWithShardedLoRA", "methods": [ { "kind": "function", "name": "MergedQKVParallelLinearWithShardedLoRA.slice_lora_a", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MergedQKVParallelLinearWithShardedLoRA.apply", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MergedQKVParallelLinearWithShardedLoRA.can_replace_layer", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [], "n_typable": 10, "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.lora.layers.column_parallel_linear.MergedQKVParallelLinearWithLoRA", "methods": [ { "kind": "function", "name": "MergedQKVParallelLinearWithLoRA.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MergedQKVParallelLinearWithLoRA.create_lora_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MergedQKVParallelLinearWithLoRA.can_replace_layer", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MergedQKVParallelLinearWithLoRA.n_slices", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MergedQKVParallelLinearWithLoRA.q_proj_shard_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MergedQKVParallelLinearWithLoRA.kv_proj_shard_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MergedQKVParallelLinearWithLoRA.q_shard_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MergedQKVParallelLinearWithLoRA.kv_shard_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MergedQKVParallelLinearWithLoRA.output_slices", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MergedQKVParallelLinearWithLoRA.output_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 11, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 8, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.lora.layers.column_parallel_linear.MergedColumnParallelLinearWithShardedLoRA", "methods": [ { "kind": "function", "name": "MergedColumnParallelLinearWithShardedLoRA.slice_lora_a", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MergedColumnParallelLinearWithShardedLoRA.apply", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MergedColumnParallelLinearWithShardedLoRA.can_replace_layer", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [], "n_typable": 10, "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.lora.layers.column_parallel_linear.MergedColumnParallelLinearWithLoRA", "methods": [ { "kind": "function", "name": "MergedColumnParallelLinearWithLoRA.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MergedColumnParallelLinearWithLoRA.create_lora_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MergedColumnParallelLinearWithLoRA.slice_lora_a", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MergedColumnParallelLinearWithLoRA.slice_lora_b", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MergedColumnParallelLinearWithLoRA.set_lora", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MergedColumnParallelLinearWithLoRA.can_replace_layer", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MergedColumnParallelLinearWithLoRA.output_slices", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MergedColumnParallelLinearWithLoRA.n_slices", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MergedColumnParallelLinearWithLoRA.output_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 18, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 13, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.lora.layers.column_parallel_linear.ColumnParallelLinearWithShardedLoRA", "methods": [ { "kind": "function", "name": "ColumnParallelLinearWithShardedLoRA.slice_lora_a", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ColumnParallelLinearWithShardedLoRA.apply", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ColumnParallelLinearWithShardedLoRA.can_replace_layer", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [], "n_typable": 10, "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.lora.layers.column_parallel_linear.QKVParallelLinearWithShardedLoRA", "methods": [ { "kind": "function", "name": "QKVParallelLinearWithShardedLoRA.slice_lora_a", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "QKVParallelLinearWithShardedLoRA.apply", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "QKVParallelLinearWithShardedLoRA.can_replace_layer", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [], "n_typable": 10, "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.lora.layers.column_parallel_linear.ColumnParallelLinearWithLoRA", "methods": [ { "kind": "function", "name": "ColumnParallelLinearWithLoRA.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ColumnParallelLinearWithLoRA.slice_lora_a", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ColumnParallelLinearWithLoRA.slice_lora_b", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ColumnParallelLinearWithLoRA.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ColumnParallelLinearWithLoRA.can_replace_layer", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ColumnParallelLinearWithLoRA.is_merged_col_linear", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ColumnParallelLinearWithLoRA.output_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ColumnParallelLinearWithLoRA.n_slices", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 13, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 8, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.lora.layers.column_parallel_linear.MergedColumnParallelLinearVariableSliceWithLoRA", "methods": [ { "kind": "function", "name": "MergedColumnParallelLinearVariableSliceWithLoRA.can_replace_layer", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MergedColumnParallelLinearVariableSliceWithLoRA.set_lora", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.lora.layers.column_parallel_linear", "names": [ "vllm.lora.layers.column_parallel_linear.ColumnParallelLinearWithLoRA", "vllm.lora.layers.column_parallel_linear.ColumnParallelLinearWithShardedLoRA", "vllm.lora.layers.column_parallel_linear.MergedColumnParallelLinearVariableSliceWithLoRA", "vllm.lora.layers.column_parallel_linear.MergedColumnParallelLinearWithLoRA", "vllm.lora.layers.column_parallel_linear.MergedColumnParallelLinearWithShardedLoRA", "vllm.lora.layers.column_parallel_linear.MergedQKVParallelLinearWithLoRA", "vllm.lora.layers.column_parallel_linear.MergedQKVParallelLinearWithShardedLoRA", "vllm.lora.layers.column_parallel_linear.QKVParallelLinearWithLoRA", "vllm.lora.layers.column_parallel_linear.QKVParallelLinearWithShardedLoRA" ], "n_typable": 119, "n_typed": 99, "n_any": 0, "n_untyped": 20, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 31, "n_method_overloads": 31, "n_method_params": 70, "n_classes": 9, "n_attrs": 18, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/lora/layers/replicated_linear.py", "symbol_reports": [ { "kind": "class", "name": "vllm.lora.layers.replicated_linear.ReplicatedLinearWithLoRA", "methods": [ { "kind": "function", "name": "ReplicatedLinearWithLoRA.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ReplicatedLinearWithLoRA.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ReplicatedLinearWithLoRA.can_replace_layer", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ReplicatedLinearWithLoRA.slice_lora_a", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ReplicatedLinearWithLoRA.slice_lora_b", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ReplicatedLinearWithLoRA.output_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ReplicatedLinearWithLoRA.n_slices", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 13, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 8, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.lora.layers.replicated_linear", "names": [ "vllm.lora.layers.replicated_linear.ReplicatedLinearWithLoRA" ], "n_typable": 15, "n_typed": 13, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 8, "n_classes": 1, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/lora/layers/vocal_parallel_embedding.py", "symbol_reports": [ { "kind": "class", "name": "vllm.lora.layers.vocal_parallel_embedding.VocabParallelEmbeddingWithLoRA", "methods": [ { "kind": "function", "name": "VocabParallelEmbeddingWithLoRA.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "VocabParallelEmbeddingWithLoRA.create_lora_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "VocabParallelEmbeddingWithLoRA.reset_lora", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "VocabParallelEmbeddingWithLoRA.set_lora", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "VocabParallelEmbeddingWithLoRA.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "VocabParallelEmbeddingWithLoRA.can_replace_layer", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [ { "kind": "property", "name": "VocabParallelEmbeddingWithLoRA.weight", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "VocabParallelEmbeddingWithLoRA.base_layer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VocabParallelEmbeddingWithLoRA.embeddings_slice", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VocabParallelEmbeddingWithLoRA.embeddings_weights", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 23, "n_typed": 19, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 13, "n_attrs": 3, "n_properties": 1 } ], "type_ignores": [], "name": "vllm.lora.layers.vocal_parallel_embedding", "names": [ "vllm.lora.layers.vocal_parallel_embedding.VocabParallelEmbeddingWithLoRA" ], "n_typable": 23, "n_typed": 19, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 13, "n_classes": 1, "n_attrs": 3, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/lora/layers/fused_moe.py", "symbol_reports": [ { "kind": "class", "name": "vllm.lora.layers.fused_moe.FusedMoE3DWithLoRA", "methods": [ { "kind": "function", "name": "FusedMoE3DWithLoRA.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FusedMoE3DWithLoRA._create_lora_b_weights", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FusedMoE3DWithLoRA.create_lora_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "FusedMoE3DWithLoRA._slice_w13_b", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FusedMoE3DWithLoRA.set_lora", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "FusedMoE3DWithLoRA.can_replace_layer", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [ { "kind": "property", "name": "FusedMoE3DWithLoRA.w13_input_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "FusedMoE3DWithLoRA.w13_output_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "FusedMoE3DWithLoRA.w2_input_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "FusedMoE3DWithLoRA.w2_output_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [], "n_typable": 24, "n_typed": 13, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 14, "n_attrs": 0, "n_properties": 4 }, { "kind": "class", "name": "vllm.lora.layers.fused_moe.FusedMoEWithLoRA", "methods": [ { "kind": "function", "name": "FusedMoEWithLoRA.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FusedMoEWithLoRA._normalize_keys", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FusedMoEWithLoRA._get_lora_moe_configs", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "FusedMoEWithLoRA._inject_lora_into_fused_moe", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FusedMoEWithLoRA._create_lora_a_weights", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FusedMoEWithLoRA._create_lora_b_weights", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FusedMoEWithLoRA.create_lora_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "FusedMoEWithLoRA._slice_w13_a", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FusedMoEWithLoRA._slice_w13_b", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FusedMoEWithLoRA._slice_w2_a", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FusedMoEWithLoRA._slice_w2_b", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FusedMoEWithLoRA.reset_lora", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FusedMoEWithLoRA.set_lora", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "FusedMoEWithLoRA.forward", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FusedMoEWithLoRA.maybe_all_reduce_tensor_model_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FusedMoEWithLoRA.can_replace_layer", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [ { "kind": "property", "name": "FusedMoEWithLoRA._shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEWithLoRA.quant_method", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEWithLoRA.is_internal_router", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "FusedMoEWithLoRA.base_layer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoEWithLoRA.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoEWithLoRA.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoEWithLoRA.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 56, "n_typed": 37, "n_any": 0, "n_untyped": 19, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 16, "n_method_overloads": 16, "n_method_params": 33, "n_attrs": 4, "n_properties": 3 } ], "type_ignores": [], "name": "vllm.lora.layers.fused_moe", "names": [ "vllm.lora.layers.fused_moe.FusedMoE3DWithLoRA", "vllm.lora.layers.fused_moe.FusedMoEWithLoRA" ], "n_typable": 80, "n_typed": 50, "n_any": 0, "n_untyped": 30, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 22, "n_method_overloads": 22, "n_method_params": 47, "n_classes": 2, "n_attrs": 4, "n_properties": 7, "n_type_ignores": 0 }, { "path": "vllm/lora/layers/row_parallel_linear.py", "symbol_reports": [ { "kind": "class", "name": "vllm.lora.layers.row_parallel_linear.RowParallelLinearWithShardedLoRA", "methods": [ { "kind": "function", "name": "RowParallelLinearWithShardedLoRA.slice_lora_b", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RowParallelLinearWithShardedLoRA.apply", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "RowParallelLinearWithShardedLoRA.can_replace_layer", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [], "n_typable": 10, "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.lora.layers.row_parallel_linear.RowParallelLinearWithLoRA", "methods": [ { "kind": "function", "name": "RowParallelLinearWithLoRA.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RowParallelLinearWithLoRA.slice_lora_a", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RowParallelLinearWithLoRA.slice_lora_b", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RowParallelLinearWithLoRA.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RowParallelLinearWithLoRA.can_replace_layer", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RowParallelLinearWithLoRA.input_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RowParallelLinearWithLoRA.output_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RowParallelLinearWithLoRA.n_slices", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 13, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 8, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.lora.layers.row_parallel_linear", "names": [ "vllm.lora.layers.row_parallel_linear.RowParallelLinearWithLoRA", "vllm.lora.layers.row_parallel_linear.RowParallelLinearWithShardedLoRA" ], "n_typable": 26, "n_typed": 23, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 15, "n_classes": 2, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/lora/layers/base.py", "symbol_reports": [ { "kind": "class", "name": "vllm.lora.layers.base.BaseLayerWithLoRA", "methods": [ { "kind": "function", "name": "BaseLayerWithLoRA.slice_lora_a", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseLayerWithLoRA.slice_lora_b", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseLayerWithLoRA.create_lora_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BaseLayerWithLoRA.reset_lora", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseLayerWithLoRA.set_lora", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BaseLayerWithLoRA.set_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseLayerWithLoRA.can_replace_layer", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [], "n_typable": 21, "n_typed": 17, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 14, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.lora.layers.base", "names": [ "vllm.lora.layers.base.BaseLayerWithLoRA" ], "n_typable": 21, "n_typed": 17, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 14, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/lora/layers/logits_processor.py", "symbol_reports": [ { "kind": "class", "name": "vllm.lora.layers.logits_processor.LogitsProcessorWithLoRA", "methods": [ { "kind": "function", "name": "LogitsProcessorWithLoRA.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "LogitsProcessorWithLoRA.create_lora_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LogitsProcessorWithLoRA.reset_lora", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LogitsProcessorWithLoRA.set_lora", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LogitsProcessorWithLoRA._get_logits", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LogitsProcessorWithLoRA.forward", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LogitsProcessorWithLoRA.can_replace_layer", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [ { "kind": "property", "name": "LogitsProcessorWithLoRA.logits_as_input", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "LogitsProcessorWithLoRA.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "LogitsProcessorWithLoRA.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "LogitsProcessorWithLoRA.soft_cap", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "LogitsProcessorWithLoRA.use_all_gather", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "LogitsProcessorWithLoRA.org_vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "LogitsProcessorWithLoRA.include_gpu_probs_tensor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "LogitsProcessorWithLoRA.should_modify_greedy_probs_inplace", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "LogitsProcessorWithLoRA.base_layer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LogitsProcessorWithLoRA.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LogitsProcessorWithLoRA.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LogitsProcessorWithLoRA.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LogitsProcessorWithLoRA.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LogitsProcessorWithLoRA.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LogitsProcessorWithLoRA.sharded_to_full_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 43, "n_typed": 23, "n_any": 0, "n_untyped": 20, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 21, "n_attrs": 7, "n_properties": 8 } ], "type_ignores": [], "name": "vllm.lora.layers.logits_processor", "names": [ "vllm.lora.layers.logits_processor.LogitsProcessorWithLoRA" ], "n_typable": 43, "n_typed": 23, "n_any": 0, "n_untyped": 20, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 21, "n_classes": 1, "n_attrs": 7, "n_properties": 8, "n_type_ignores": 0 }, { "path": "vllm/lora/layers/base_linear.py", "symbol_reports": [ { "kind": "class", "name": "vllm.lora.layers.base_linear.BaseLinearLayerWithLoRA", "methods": [ { "kind": "function", "name": "BaseLinearLayerWithLoRA.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseLinearLayerWithLoRA.create_lora_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BaseLinearLayerWithLoRA.reset_lora", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseLinearLayerWithLoRA.set_lora", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BaseLinearLayerWithLoRA.apply", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [ { "kind": "property", "name": "BaseLinearLayerWithLoRA.weight", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "BaseLinearLayerWithLoRA.bias", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "BaseLinearLayerWithLoRA.base_layer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseLinearLayerWithLoRA.input_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseLinearLayerWithLoRA.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseLinearLayerWithLoRA.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseLinearLayerWithLoRA.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseLinearLayerWithLoRA.output_slices", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BaseLinearLayerWithLoRA.output_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BaseLinearLayerWithLoRA.n_slices", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 25, "n_typed": 17, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 10, "n_attrs": 8, "n_properties": 2 } ], "type_ignores": [], "name": "vllm.lora.layers.base_linear", "names": [ "vllm.lora.layers.base_linear.BaseLinearLayerWithLoRA" ], "n_typable": 25, "n_typed": 17, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 10, "n_classes": 1, "n_attrs": 8, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/lora/lora_model.py", "symbol_reports": [ { "kind": "class", "name": "vllm.lora.lora_model.LoRAModel", "methods": [ { "kind": "function", "name": "LoRAModel.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LoRAModel.clone", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LoRAModel.get_lora", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LoRAModel.check_lora_name", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LoRAModel._should_skip_module", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LoRAModel.from_lora_tensors", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "LoRAModel.from_local_checkpoint", "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LoRAModel.id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoRAModel.rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoRAModel.loras", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 36, "n_typed": 34, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 26, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.lora.lora_model.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.lora.lora_model", "names": [ "vllm.lora.lora_model.LoRAModel", "vllm.lora.lora_model.logger" ], "n_typable": 37, "n_typed": 34, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 26, "n_classes": 1, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/lora/lora_weights.py", "symbol_reports": [ { "kind": "class", "name": "vllm.lora.lora_weights.LoRALayerWeights", "methods": [ { "kind": "function", "name": "LoRALayerWeights.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "LoRALayerWeights.optimize", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LoRALayerWeights.from_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LoRALayerWeights.create_dummy_lora_weights", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [ { "kind": "property", "name": "LoRALayerWeights.input_dim", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "LoRALayerWeights.output_dim", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "LoRALayerWeights.is_packed", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "LoRALayerWeights.module_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoRALayerWeights.rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoRALayerWeights.lora_alpha", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoRALayerWeights.lora_a", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoRALayerWeights.lora_b", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoRALayerWeights.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 27, "n_typed": 21, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 14, "n_attrs": 6, "n_properties": 3 }, { "kind": "class", "name": "vllm.lora.lora_weights.PackedLoRALayerWeights", "methods": [ { "kind": "function", "name": "PackedLoRALayerWeights.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "PackedLoRALayerWeights.pack", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PackedLoRALayerWeights.pack_moe", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "PackedLoRALayerWeights.optimize", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "PackedLoRALayerWeights.input_dim", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "PackedLoRALayerWeights.output_dim", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "PackedLoRALayerWeights.is_packed", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "PackedLoRALayerWeights.lora_alphas", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PackedLoRALayerWeights.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 17, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 10, "n_attrs": 2, "n_properties": 3 } ], "type_ignores": [], "name": "vllm.lora.lora_weights", "names": [ "vllm.lora.lora_weights.LoRALayerWeights", "vllm.lora.lora_weights.PackedLoRALayerWeights" ], "n_typable": 46, "n_typed": 38, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 24, "n_classes": 2, "n_attrs": 8, "n_properties": 6, "n_type_ignores": 0 }, { "path": "vllm/lora/model_manager.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.lora.model_manager.DEFAULT_LANGUAGE_WRAPPER_KEY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.lora.model_manager.T", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.lora.model_manager.LRUCacheLoRAModelManager", "methods": [ { "kind": "function", "name": "LRUCacheLoRAModelManager.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "LRUCacheLoRAModelManager.list_adapters", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LRUCacheLoRAModelManager.add_adapter", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LRUCacheLoRAModelManager.activate_adapter", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LRUCacheLoRAModelManager.remove_oldest_adapter", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LRUCacheLoRAModelManager.pin_adapter", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LRUCacheLoRAModelManager._pin_lora_in_cpu_cache", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LRUCacheLoRAModelManager._pin_lora_in_gpu_cache", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 20, "n_typed": 17, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 12, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.lora.model_manager.create_lora_manager", "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "class", "name": "vllm.lora.model_manager.AdapterLRUCache", "methods": [ { "kind": "function", "name": "AdapterLRUCache.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AdapterLRUCache._on_remove", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AdapterLRUCache.deactivate_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 4, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.lora.model_manager.LoRALRUCache", "methods": [ { "kind": "function", "name": "LoRALRUCache.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.lora.model_manager.LoRAModelManager", "methods": [ { "kind": "function", "name": "LoRAModelManager.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "LoRAModelManager._init_punica_wrapper", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LoRAModelManager._maybe_init_mm", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LoRAModelManager.__len__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LoRAModelManager.activate_adapter", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LoRAModelManager._deactivate_adapter", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LoRAModelManager._add_adapter", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LoRAModelManager.pin_adapter", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LoRAModelManager._set_adapter_mapping", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LoRAModelManager.remove_all_adapters", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LoRAModelManager._create_lora_modules", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LoRAModelManager.register_module", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LoRAModelManager._pad_lora_pairs_to_triplets", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LoRAModelManager.create_dummy_lora", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LoRAModelManager._match_target_modules", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LoRAModelManager._get_punica_wrapper", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LoRAModelManager._register_packed_modules", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LoRAModelManager._create_merged_loras_inplace", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LoRAModelManager._stack_moe_lora_weights", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LoRAModelManager._get_lora_layer_weights", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LoRAModelManager.deactivate_adapter", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LoRAModelManager.add_adapter", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LoRAModelManager.set_adapter_mapping", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LoRAModelManager.remove_adapter", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LoRAModelManager.list_adapters", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LoRAModelManager.get_adapter", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "LoRAModelManager.capacity", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "LoRAModelManager.lora_slots", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "LoRAModelManager.adapter_slots", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "LoRAModelManager.model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LoRAModelManager.supported_lora_modules", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoRAModelManager.adapter_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoRAModelManager.lora_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoRAModelManager.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoRAModelManager.max_num_seqs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoRAModelManager.max_num_batched_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoRAModelManager.lora_index_to_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LoRAModelManager.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoRAModelManager.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoRAModelManager.is_pooling_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoRAModelManager.packed_modules", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LoRAModelManager.modules", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 78, "n_typed": 61, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 26, "n_method_overloads": 26, "n_method_params": 36, "n_attrs": 13, "n_properties": 3 }, { "kind": "attr", "name": "vllm.lora.model_manager.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.lora.model_manager", "names": [ "vllm.lora.model_manager.AdapterLRUCache", "vllm.lora.model_manager.DEFAULT_LANGUAGE_WRAPPER_KEY", "vllm.lora.model_manager.LRUCacheLoRAModelManager", "vllm.lora.model_manager.LoRALRUCache", "vllm.lora.model_manager.LoRAModelManager", "vllm.lora.model_manager.T", "vllm.lora.model_manager.create_lora_manager", "vllm.lora.model_manager.logger" ], "n_typable": 119, "n_typed": 93, "n_any": 0, "n_untyped": 26, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 9, "n_methods": 37, "n_method_overloads": 37, "n_method_params": 54, "n_classes": 4, "n_attrs": 17, "n_properties": 3, "n_type_ignores": 0 }, { "path": "vllm/lora/ops/torch_ops/lora_ops.py", "symbol_reports": [ { "kind": "function", "name": "vllm.lora.ops.torch_ops.lora_ops.sgmv_shrink", "n_typed": 10, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "vllm.lora.ops.torch_ops.lora_ops.bgmv_expand_slice", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "vllm.lora.ops.torch_ops.lora_ops.bgmv_shrink", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.lora.ops.torch_ops.lora_ops.sgmv_expand", "n_typed": 10, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "vllm.lora.ops.torch_ops.lora_ops.sgmv_expand_slice", "n_typed": 12, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 }, { "kind": "function", "name": "vllm.lora.ops.torch_ops.lora_ops.bgmv_expand", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "type_ignores": [], "name": "vllm.lora.ops.torch_ops.lora_ops", "names": [ "vllm.lora.ops.torch_ops.lora_ops.bgmv_expand", "vllm.lora.ops.torch_ops.lora_ops.bgmv_expand_slice", "vllm.lora.ops.torch_ops.lora_ops.bgmv_shrink", "vllm.lora.ops.torch_ops.lora_ops.sgmv_expand", "vllm.lora.ops.torch_ops.lora_ops.sgmv_expand_slice", "vllm.lora.ops.torch_ops.lora_ops.sgmv_shrink" ], "n_typable": 55, "n_typed": 49, "n_any": 0, "n_untyped": 6, "n_functions": 6, "n_function_overloads": 6, "n_function_params": 49, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/lora/ops/triton_ops/__init__.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.lora.ops.triton_ops.fused_moe_lora_expand_fp8", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.lora.ops.triton_ops.fused_moe_lora_fp8", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.lora.ops.triton_ops.fused_moe_lora_shrink", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.lora.ops.triton_ops.fused_moe_lora", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.lora.ops.triton_ops.fused_moe_lora_shrink_fp8", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.lora.ops.triton_ops.lora_expand", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.lora.ops.triton_ops.fused_moe_lora_expand", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.lora.ops.triton_ops.lora_shrink", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.lora.ops.triton_ops", "names": [ "vllm.lora.ops.triton_ops.fused_moe_lora", "vllm.lora.ops.triton_ops.fused_moe_lora_expand", "vllm.lora.ops.triton_ops.fused_moe_lora_expand_fp8", "vllm.lora.ops.triton_ops.fused_moe_lora_fp8", "vllm.lora.ops.triton_ops.fused_moe_lora_shrink", "vllm.lora.ops.triton_ops.fused_moe_lora_shrink_fp8", "vllm.lora.ops.triton_ops.lora_expand", "vllm.lora.ops.triton_ops.lora_shrink" ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 8, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/lora/ops/triton_ops/lora_kernel_metadata.py", "symbol_reports": [ { "kind": "class", "name": "vllm.lora.ops.triton_ops.lora_kernel_metadata.LoRAKernelMeta", "methods": [ { "kind": "function", "name": "LoRAKernelMeta.make", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "LoRAKernelMeta._reset", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LoRAKernelMeta.prepare_tensors", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LoRAKernelMeta.meta_args", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LoRAKernelMeta.token_lora_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LoRAKernelMeta.token_indices_sorted_by_lora_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LoRAKernelMeta.active_lora_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LoRAKernelMeta.num_tokens_per_lora", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LoRAKernelMeta.lora_token_start_loc", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LoRAKernelMeta.no_lora_flag_cpu", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LoRAKernelMeta.num_active_loras_cpu", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LoRAKernelMeta.default_num_active_loras_cpu", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LoRAKernelMeta.captured_lora_counts", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 11, "n_typed": 10, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 7, "n_attrs": 9, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.lora.ops.triton_ops.lora_kernel_metadata", "names": [ "vllm.lora.ops.triton_ops.lora_kernel_metadata.LoRAKernelMeta" ], "n_typable": 11, "n_typed": 10, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 7, "n_classes": 1, "n_attrs": 9, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/lora/ops/triton_ops/kernel_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.lora.ops.triton_ops.kernel_utils.do_expand_kernel", "n_typed": 9, "n_any": 0, "n_untyped": 20, "n_overloads": 1, "n_typable": 29, "n_params": 28, "n_function_overloads": 1, "n_function_params": 28 }, { "kind": "function", "name": "vllm.lora.ops.triton_ops.kernel_utils.do_shrink_kernel", "n_typed": 7, "n_any": 0, "n_untyped": 21, "n_overloads": 1, "n_typable": 28, "n_params": 27, "n_function_overloads": 1, "n_function_params": 27 }, { "kind": "function", "name": "vllm.lora.ops.triton_ops.kernel_utils.mm_k", "n_typed": 9, "n_any": 0, "n_untyped": 7, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 } ], "type_ignores": [], "name": "vllm.lora.ops.triton_ops.kernel_utils", "names": [ "vllm.lora.ops.triton_ops.kernel_utils.do_expand_kernel", "vllm.lora.ops.triton_ops.kernel_utils.do_shrink_kernel", "vllm.lora.ops.triton_ops.kernel_utils.mm_k" ], "n_typable": 73, "n_typed": 25, "n_any": 0, "n_untyped": 48, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 70, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/lora/ops/triton_ops/utils.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.lora.ops.triton_ops.utils.is_batch_invariant", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.lora.ops.triton_ops.utils.load_lora_op_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.lora.ops.triton_ops.utils.supports_tma", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.lora.ops.triton_ops.utils.get_lora_op_configs", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "vllm.lora.ops.triton_ops.utils.supports_pdl", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.lora.ops.triton_ops.utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.lora.ops.triton_ops.utils", "names": [ "vllm.lora.ops.triton_ops.utils.get_lora_op_configs", "vllm.lora.ops.triton_ops.utils.is_batch_invariant", "vllm.lora.ops.triton_ops.utils.load_lora_op_config", "vllm.lora.ops.triton_ops.utils.logger", "vllm.lora.ops.triton_ops.utils.supports_pdl", "vllm.lora.ops.triton_ops.utils.supports_tma" ], "n_typable": 18, "n_typed": 16, "n_any": 0, "n_untyped": 2, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 12, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/lora/ops/xpu_ops/lora_ops.py", "symbol_reports": [ { "kind": "function", "name": "vllm.lora.ops.xpu_ops.lora_ops.bgmv_expand", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.lora.ops.xpu_ops.lora_ops.bgmv_expand_slice", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "vllm.lora.ops.xpu_ops.lora_ops.bgmv_shrink", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "attr", "name": "vllm.lora.ops.xpu_ops.lora_ops.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.lora.ops.xpu_ops.lora_ops", "names": [ "vllm.lora.ops.xpu_ops.lora_ops.bgmv_expand", "vllm.lora.ops.xpu_ops.lora_ops.bgmv_expand_slice", "vllm.lora.ops.xpu_ops.lora_ops.bgmv_shrink", "vllm.lora.ops.xpu_ops.lora_ops.logger" ], "n_typable": 21, "n_typed": 20, "n_any": 0, "n_untyped": 1, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 17, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/lora/peft_helper.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.lora.peft_helper.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.lora.peft_helper.PEFTHelper", "methods": [ { "kind": "function", "name": "PEFTHelper._validate_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PEFTHelper.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PEFTHelper.from_dict", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PEFTHelper.from_local_dir", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "PEFTHelper.validate_legal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PEFTHelper.r", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PEFTHelper.lora_alpha", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PEFTHelper.target_modules", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PEFTHelper.bias", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PEFTHelper.modules_to_save", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PEFTHelper.use_rslora", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PEFTHelper.use_dora", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PEFTHelper.vllm_lora_scaling_factor", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PEFTHelper.vllm_max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 10, "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 5, "n_attrs": 9, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.lora.peft_helper", "names": [ "vllm.lora.peft_helper.PEFTHelper", "vllm.lora.peft_helper.logger" ], "n_typable": 11, "n_typed": 9, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 5, "n_classes": 1, "n_attrs": 10, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/lora/punica_wrapper/punica_base.py", "symbol_reports": [ { "kind": "class", "name": "vllm.lora.punica_wrapper.punica_base.PunicaWrapperBase", "methods": [ { "kind": "function", "name": "PunicaWrapperBase.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "PunicaWrapperBase._update_base_metadata", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "PunicaWrapperBase._update_prefill_metadata", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PunicaWrapperBase.update_metadata", "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "PunicaWrapperBase.add_shrink", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "PunicaWrapperBase.add_expand", "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "PunicaWrapperBase.add_lora_embedding", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "PunicaWrapperBase.add_lora_linear", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "PunicaWrapperBase.add_lora_logits", "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "PunicaWrapperBase.moe_lora_align_block_size", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "PunicaWrapperBase.add_lora_fused_moe", "n_typed": 14, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 18, "n_params": 17, "n_function_overloads": 1, "n_function_params": 17 } ], "properties": [ { "kind": "property", "name": "PunicaWrapperBase.prefill_metadata", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "PunicaWrapperBase.token_lora_indices", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "PunicaWrapperBase.sampler_indices", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "PunicaWrapperBase.sampler_indices_padded", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "PunicaWrapperBase.embeddings_indices", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "PunicaWrapperBase.indices_len", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PunicaWrapperBase.device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PunicaWrapperBase.max_length", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PunicaWrapperBase.token_nums", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PunicaWrapperBase.batch_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PunicaWrapperBase.is_prefill", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PunicaWrapperBase.no_lora", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 95, "n_typed": 77, "n_any": 0, "n_untyped": 18, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 72, "n_attrs": 7, "n_properties": 5 }, { "kind": "class", "name": "vllm.lora.punica_wrapper.punica_base.PunicaWrapperABC", "methods": [ { "kind": "function", "name": "PunicaWrapperABC.update_metadata", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "PunicaWrapperABC.add_shrink", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "PunicaWrapperABC.add_expand", "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "PunicaWrapperABC.add_lora_embedding", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "PunicaWrapperABC.add_lora_linear", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "PunicaWrapperABC.add_lora_logits", "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [], "n_typable": 43, "n_typed": 35, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 37, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.lora.punica_wrapper.punica_base", "names": [ "vllm.lora.punica_wrapper.punica_base.PunicaWrapperABC", "vllm.lora.punica_wrapper.punica_base.PunicaWrapperBase" ], "n_typable": 138, "n_typed": 112, "n_any": 0, "n_untyped": 26, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 17, "n_method_overloads": 17, "n_method_params": 109, "n_classes": 2, "n_attrs": 7, "n_properties": 5, "n_type_ignores": 0 }, { "path": "vllm/lora/punica_wrapper/punica_selector.py", "symbol_reports": [ { "kind": "function", "name": "vllm.lora.punica_wrapper.punica_selector.get_punica_wrapper", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.lora.punica_wrapper.punica_selector.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.lora.punica_wrapper.punica_selector", "names": [ "vllm.lora.punica_wrapper.punica_selector.get_punica_wrapper", "vllm.lora.punica_wrapper.punica_selector.logger" ], "n_typable": 4, "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/lora/punica_wrapper/punica_cpu.py", "symbol_reports": [ { "kind": "class", "name": "vllm.lora.punica_wrapper.punica_cpu.PunicaWrapperCPU", "methods": [ { "kind": "function", "name": "PunicaWrapperCPU.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "PunicaWrapperCPU._shrink_prefill", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "PunicaWrapperCPU._shrink_decode", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "PunicaWrapperCPU._expand_prefill", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "PunicaWrapperCPU._expand_decode", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "PunicaWrapperCPU._expand_slice_prefill", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "PunicaWrapperCPU._expand_slice_decode", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "PunicaWrapperCPU._apply_expand", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "PunicaWrapperCPU._apply_shrink", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "PunicaWrapperCPU.add_shrink", "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "PunicaWrapperCPU.add_expand", "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "PunicaWrapperCPU.add_lora_embedding", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "PunicaWrapperCPU.add_lora_linear", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "PunicaWrapperCPU.add_lora_logits", "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [], "n_typable": 88, "n_typed": 70, "n_any": 0, "n_untyped": 18, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 74, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.lora.punica_wrapper.punica_cpu", "names": [ "vllm.lora.punica_wrapper.punica_cpu.PunicaWrapperCPU" ], "n_typable": 88, "n_typed": 70, "n_any": 0, "n_untyped": 18, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 74, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/lora/punica_wrapper/punica_gpu.py", "symbol_reports": [ { "kind": "class", "name": "vllm.lora.punica_wrapper.punica_gpu.PunicaWrapperGPU", "methods": [ { "kind": "function", "name": "PunicaWrapperGPU.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "PunicaWrapperGPU.update_metadata", "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "PunicaWrapperGPU.add_shrink", "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "PunicaWrapperGPU.add_expand", "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "PunicaWrapperGPU.add_lora_embedding", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "PunicaWrapperGPU.add_lora_linear", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "PunicaWrapperGPU.add_lora_logits", "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "PunicaWrapperGPU.moe_lora_align_block_size", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "PunicaWrapperGPU.add_lora_fused_moe", "n_typed": 14, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 18, "n_params": 17, "n_function_overloads": 1, "n_function_params": 17 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PunicaWrapperGPU.lora_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PunicaWrapperGPU.max_loras", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PunicaWrapperGPU.token_mapping_meta", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PunicaWrapperGPU.prompt_mapping_meta", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 80, "n_typed": 60, "n_any": 0, "n_untyped": 20, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 67, "n_attrs": 4, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.lora.punica_wrapper.punica_gpu", "names": [ "vllm.lora.punica_wrapper.punica_gpu.PunicaWrapperGPU" ], "n_typable": 80, "n_typed": 60, "n_any": 0, "n_untyped": 20, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 67, "n_classes": 1, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/lora/punica_wrapper/punica_xpu.py", "symbol_reports": [ { "kind": "class", "name": "vllm.lora.punica_wrapper.punica_xpu.PunicaWrapperXPU", "methods": [ { "kind": "function", "name": "PunicaWrapperXPU.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "PunicaWrapperXPU.update_metadata", "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "PunicaWrapperXPU._get_token_lora_indices", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PunicaWrapperXPU._apply_shrink", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "PunicaWrapperXPU._apply_expand", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "PunicaWrapperXPU.add_shrink", "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "PunicaWrapperXPU.add_expand", "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "PunicaWrapperXPU.add_lora_embedding", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "PunicaWrapperXPU.add_lora_linear", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "PunicaWrapperXPU.add_lora_logits", "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "PunicaWrapperXPU.moe_lora_align_block_size", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "PunicaWrapperXPU.add_lora_fused_moe", "n_typed": 14, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 18, "n_params": 17, "n_function_overloads": 1, "n_function_params": 17 } ], "properties": [ { "kind": "property", "name": "PunicaWrapperXPU.sampler_indices_padded", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "PunicaWrapperXPU.lora_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PunicaWrapperXPU.max_loras", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PunicaWrapperXPU.token_mapping_meta", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 94, "n_typed": 73, "n_any": 0, "n_untyped": 21, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 78, "n_attrs": 3, "n_properties": 1 } ], "type_ignores": [], "name": "vllm.lora.punica_wrapper.punica_xpu", "names": [ "vllm.lora.punica_wrapper.punica_xpu.PunicaWrapperXPU" ], "n_typable": 94, "n_typed": 73, "n_any": 0, "n_untyped": 21, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 78, "n_classes": 1, "n_attrs": 3, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/lora/punica_wrapper/utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.lora.punica_wrapper.utils.compute_meta", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.lora.punica_wrapper.utils.convert_mapping", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "type_ignores": [], "name": "vllm.lora.punica_wrapper.utils", "names": [ "vllm.lora.punica_wrapper.utils.compute_meta", "vllm.lora.punica_wrapper.utils.convert_mapping" ], "n_typable": 9, "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 7, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/lora/request.py", "symbol_reports": [ { "kind": "class", "name": "vllm.lora.request.LoRARequest", "methods": [ { "kind": "function", "name": "LoRARequest.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LoRARequest.__eq__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LoRARequest.__hash__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "LoRARequest.adapter_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "LoRARequest.name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "LoRARequest.path", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "LoRARequest.lora_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LoRARequest.lora_int_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LoRARequest.lora_path", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LoRARequest.base_model_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LoRARequest.tensorizer_config_dict", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LoRARequest.load_inplace", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 13, "n_typed": 9, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 1, "n_attrs": 6, "n_properties": 3 } ], "type_ignores": [ { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] } ], "name": "vllm.lora.request", "names": [ "vllm.lora.request.LoRARequest" ], "n_typable": 13, "n_typed": 9, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 1, "n_classes": 1, "n_attrs": 6, "n_properties": 3, "n_type_ignores": 2 }, { "path": "vllm/lora/resolver.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.lora.resolver.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.lora.resolver.LoRAResolverRegistry", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.lora.resolver.LoRAResolver", "methods": [ { "kind": "function", "name": "LoRAResolver.resolve_lora", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.lora.resolver", "names": [ "vllm.lora.resolver.LoRAResolver", "vllm.lora.resolver.LoRAResolverRegistry", "vllm.lora.resolver.logger" ], "n_typable": 5, "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_classes": 1, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/lora/utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.lora.utils.parse_fine_tuned_lora_name", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.lora.utils.process_packed_modules_mapping", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.lora.utils.get_adapter_absolute_path", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.lora.utils.is_base_embeddding_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.lora.utils.replace_submodule", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.lora.utils.get_captured_lora_counts", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.lora.utils.from_layer", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.lora.utils.is_moe_model", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.lora.utils.from_layer_logits_processor", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.lora.utils.get_lora_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.lora.utils.get_supported_lora_modules", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.lora.utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.lora.utils", "names": [ "vllm.lora.utils.from_layer", "vllm.lora.utils.from_layer_logits_processor", "vllm.lora.utils.get_adapter_absolute_path", "vllm.lora.utils.get_captured_lora_counts", "vllm.lora.utils.get_lora_id", "vllm.lora.utils.get_supported_lora_modules", "vllm.lora.utils.is_base_embeddding_weights", "vllm.lora.utils.is_moe_model", "vllm.lora.utils.logger", "vllm.lora.utils.parse_fine_tuned_lora_name", "vllm.lora.utils.process_packed_modules_mapping", "vllm.lora.utils.replace_submodule" ], "n_typable": 34, "n_typed": 32, "n_any": 0, "n_untyped": 2, "n_functions": 11, "n_function_overloads": 11, "n_function_params": 22, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/lora/worker_manager.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.lora.worker_manager.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.lora.worker_manager.WorkerLoRAManager", "methods": [ { "kind": "function", "name": "WorkerLoRAManager.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "WorkerLoRAManager.dummy_lora_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "WorkerLoRAManager.create_lora_manager", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "WorkerLoRAManager._load_adapter", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WorkerLoRAManager.add_dummy_lora", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "WorkerLoRAManager.pin_adapter", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WorkerLoRAManager.set_active_adapters", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "WorkerLoRAManager.supports_tower_connector_lora", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "WorkerLoRAManager._apply_adapters", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WorkerLoRAManager.add_adapter", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WorkerLoRAManager.remove_adapter", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WorkerLoRAManager.remove_all_adapters", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "WorkerLoRAManager.list_adapters", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "WorkerLoRAManager.is_enabled", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "WorkerLoRAManager._manager_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "WorkerLoRAManager.embedding_modules", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WorkerLoRAManager.max_num_seqs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WorkerLoRAManager.max_num_batched_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WorkerLoRAManager.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WorkerLoRAManager.lora_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WorkerLoRAManager.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WorkerLoRAManager.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 37, "n_typed": 25, "n_any": 2, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 15, "n_attrs": 8, "n_properties": 1 }, { "kind": "class", "name": "vllm.lora.worker_manager.LRUCacheWorkerLoRAManager", "methods": [ { "kind": "function", "name": "LRUCacheWorkerLoRAManager.create_lora_manager", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LRUCacheWorkerLoRAManager._apply_adapters", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LRUCacheWorkerLoRAManager.add_adapter", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LRUCacheWorkerLoRAManager._manager_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 8, "n_typed": 7, "n_any": 1, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.lora.worker_manager", "names": [ "vllm.lora.worker_manager.LRUCacheWorkerLoRAManager", "vllm.lora.worker_manager.WorkerLoRAManager", "vllm.lora.worker_manager.logger" ], "n_typable": 46, "n_typed": 32, "n_any": 3, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 16, "n_method_overloads": 16, "n_method_params": 19, "n_classes": 2, "n_attrs": 10, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/parameter.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.parameter.PackedvLLMParameter", "methods": [ { "kind": "function", "name": "PackedvLLMParameter.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "PackedvLLMParameter.adjust_shard_indexes_for_packing", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [ { "kind": "property", "name": "PackedvLLMParameter.packed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "PackedvLLMParameter.packed_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "PackedvLLMParameter.marlin_tile_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [], "n_typable": 11, "n_typed": 3, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 0, "n_properties": 3 }, { "kind": "class", "name": "vllm.model_executor.parameter.BasevLLMParameter", "methods": [ { "kind": "function", "name": "BasevLLMParameter.__new__", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BasevLLMParameter.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BasevLLMParameter._is_1d_and_scalar", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BasevLLMParameter._assert_and_load", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BasevLLMParameter.load_column_parallel_weight", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BasevLLMParameter.load_row_parallel_weight", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BasevLLMParameter.load_merged_column_weight", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BasevLLMParameter.load_qkv_weight", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BasevLLMParameter._shard_id_as_int", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BasevLLMParameter.__torch_function__", "n_typed": 0, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [ { "kind": "property", "name": "BasevLLMParameter.weight_loader", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_typable": 2 } ], "attrs": [ { "kind": "attr", "name": "BasevLLMParameter.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BasevLLMParameter.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 31, "n_typed": 13, "n_any": 0, "n_untyped": 18, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 17, "n_attrs": 2, "n_properties": 1 }, { "kind": "class", "name": "vllm.model_executor.parameter.ModelWeightParameter", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.parameter.ChannelQuantScaleParameter", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.parameter.PerTensorScaleParameter", "methods": [ { "kind": "function", "name": "PerTensorScaleParameter.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PerTensorScaleParameter.load_row_parallel_weight", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PerTensorScaleParameter.load_merged_column_weight", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PerTensorScaleParameter.load_qkv_weight", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PerTensorScaleParameter.load_column_parallel_weight", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PerTensorScaleParameter._load_into_shard_id", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 18, "n_typed": 2, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 12, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.parameter.PackedColumnParameter", "methods": [ { "kind": "function", "name": "PackedColumnParameter.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "PackedColumnParameter.adjust_shard_indexes_for_packing", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [ { "kind": "property", "name": "PackedColumnParameter.packed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "PackedColumnParameter.packed_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "PackedColumnParameter.marlin_tile_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [], "n_typable": 11, "n_typed": 3, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 0, "n_properties": 3 }, { "kind": "class", "name": "vllm.model_executor.parameter.RowvLLMParameter", "methods": [ { "kind": "function", "name": "RowvLLMParameter.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "RowvLLMParameter.load_row_parallel_weight", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "RowvLLMParameter.input_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [], "n_typable": 6, "n_typed": 2, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 0, "n_properties": 1 }, { "kind": "class", "name": "vllm.model_executor.parameter.GroupQuantScaleParameter", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.parameter", "names": [ "vllm.model_executor.parameter.BasevLLMParameter", "vllm.model_executor.parameter.ChannelQuantScaleParameter", "vllm.model_executor.parameter.GroupQuantScaleParameter", "vllm.model_executor.parameter.ModelWeightParameter", "vllm.model_executor.parameter.PackedColumnParameter", "vllm.model_executor.parameter.PackedvLLMParameter", "vllm.model_executor.parameter.PerTensorScaleParameter", "vllm.model_executor.parameter.RowvLLMParameter" ], "n_typable": 77, "n_typed": 23, "n_any": 0, "n_untyped": 54, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 22, "n_method_overloads": 22, "n_method_params": 44, "n_classes": 8, "n_attrs": 2, "n_properties": 8, "n_type_ignores": 0 }, { "path": "vllm/model_executor/custom_op.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.custom_op.CustomOp", "methods": [ { "kind": "function", "name": "CustomOp.__new__", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CustomOp.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CustomOp.forward", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CustomOp.forward_native", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CustomOp.forward_cuda", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CustomOp.forward_hip", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CustomOp.forward_xpu", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CustomOp.forward_cpu", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CustomOp.forward_tpu", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CustomOp.forward_oot", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CustomOp.dispatch_forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CustomOp.maybe_compile", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CustomOp.enabled", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CustomOp.default_on", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CustomOp.register", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CustomOp.register_oot", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 43, "n_typed": 9, "n_any": 0, "n_untyped": 34, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 16, "n_method_overloads": 16, "n_method_params": 27, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.custom_op.PluggableLayer", "methods": [ { "kind": "function", "name": "PluggableLayer.__new__", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PluggableLayer.register", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PluggableLayer.register_oot", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 8, "n_typed": 2, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.custom_op.op_registry_oot", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.custom_op.op_registry", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.custom_op.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.custom_op", "names": [ "vllm.model_executor.custom_op.CustomOp", "vllm.model_executor.custom_op.PluggableLayer", "vllm.model_executor.custom_op.logger", "vllm.model_executor.custom_op.op_registry", "vllm.model_executor.custom_op.op_registry_oot" ], "n_typable": 54, "n_typed": 13, "n_any": 0, "n_untyped": 41, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 19, "n_method_overloads": 19, "n_method_params": 32, "n_classes": 2, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/kernels/linear/mixed_precision/marlin.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.kernels.linear.mixed_precision.marlin.MarlinLinearKernel", "methods": [ { "kind": "function", "name": "MarlinLinearKernel.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MarlinLinearKernel.can_implement", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MarlinLinearKernel.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MarlinLinearKernel.apply_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.kernels.linear.mixed_precision.marlin", "names": [ "vllm.model_executor.kernels.linear.mixed_precision.marlin.MarlinLinearKernel" ], "n_typable": 9, "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 5, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/kernels/linear/scaled_mm/pytorch.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.kernels.linear.scaled_mm.pytorch.RowWiseTorchFP8ScaledMMLinearKernel", "methods": [ { "kind": "function", "name": "RowWiseTorchFP8ScaledMMLinearKernel.is_supported", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RowWiseTorchFP8ScaledMMLinearKernel.can_implement", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RowWiseTorchFP8ScaledMMLinearKernel.apply_scaled_mm", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.kernels.linear.scaled_mm.pytorch.PerTensorTorchFP8ScaledMMLinearKernel", "methods": [ { "kind": "function", "name": "PerTensorTorchFP8ScaledMMLinearKernel.can_implement", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PerTensorTorchFP8ScaledMMLinearKernel.apply_scaled_mm", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [], "n_typable": 10, "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.kernels.linear.scaled_mm.pytorch.ChannelWiseTorchFP8ScaledMMLinearKernel", "methods": [ { "kind": "function", "name": "ChannelWiseTorchFP8ScaledMMLinearKernel.can_implement", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ChannelWiseTorchFP8ScaledMMLinearKernel.apply_scaled_mm", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [], "n_typable": 10, "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.kernels.linear.scaled_mm.pytorch.TorchFP8ScaledMMLinearKernel", "methods": [ { "kind": "function", "name": "TorchFP8ScaledMMLinearKernel.is_supported", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TorchFP8ScaledMMLinearKernel.get_output_padding", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.kernels.linear.scaled_mm.pytorch", "names": [ "vllm.model_executor.kernels.linear.scaled_mm.pytorch.ChannelWiseTorchFP8ScaledMMLinearKernel", "vllm.model_executor.kernels.linear.scaled_mm.pytorch.PerTensorTorchFP8ScaledMMLinearKernel", "vllm.model_executor.kernels.linear.scaled_mm.pytorch.RowWiseTorchFP8ScaledMMLinearKernel", "vllm.model_executor.kernels.linear.scaled_mm.pytorch.TorchFP8ScaledMMLinearKernel" ], "n_typable": 35, "n_typed": 35, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 26, "n_classes": 4, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/kernels/linear/mixed_precision/dynamic_4bit.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.kernels.linear.mixed_precision.dynamic_4bit.Dynamic4bitLinearKernel", "methods": [ { "kind": "function", "name": "Dynamic4bitLinearKernel.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Dynamic4bitLinearKernel.can_implement", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Dynamic4bitLinearKernel.process_weights_after_loading", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Dynamic4bitLinearKernel.apply_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Dynamic4bitLinearKernel.SUPPORTED_QUANT_TYPES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 9, "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 5, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.kernels.linear.mixed_precision.dynamic_4bit", "names": [ "vllm.model_executor.kernels.linear.mixed_precision.dynamic_4bit.Dynamic4bitLinearKernel" ], "n_typable": 9, "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 5, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/kernels/linear/__init__.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.kernels.linear.init_int8_linear_kernel", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.kernels.linear.init_fp8_linear_kernel", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.model_executor.kernels.linear.choose_mp_linear_kernel", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.model_executor.kernels.linear", "names": [ "vllm.model_executor.kernels.linear.choose_mp_linear_kernel", "vllm.model_executor.kernels.linear.init_fp8_linear_kernel", "vllm.model_executor.kernels.linear.init_int8_linear_kernel" ], "n_typable": 14, "n_typed": 14, "n_any": 0, "n_untyped": 0, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 11, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/kernels/linear/scaled_mm/rocm.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.kernels.linear.scaled_mm.rocm.ROCmFP8ScaledMMLinearKernel", "methods": [ { "kind": "function", "name": "ROCmFP8ScaledMMLinearKernel.is_supported", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ROCmFP8ScaledMMLinearKernel.can_implement", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ROCmFP8ScaledMMLinearKernel.apply_scaled_mm", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.kernels.linear.scaled_mm.rocm.rocm_per_tensor_float_w8a8_scaled_mm_fake", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.model_executor.kernels.linear.scaled_mm.rocm.rocm_per_tensor_float_w8a8_scaled_mm_impl", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "type_ignores": [], "name": "vllm.model_executor.kernels.linear.scaled_mm.rocm", "names": [ "vllm.model_executor.kernels.linear.scaled_mm.rocm.ROCmFP8ScaledMMLinearKernel", "vllm.model_executor.kernels.linear.scaled_mm.rocm.rocm_per_tensor_float_w8a8_scaled_mm_fake", "vllm.model_executor.kernels.linear.scaled_mm.rocm.rocm_per_tensor_float_w8a8_scaled_mm_impl" ], "n_typable": 26, "n_typed": 26, "n_any": 0, "n_untyped": 0, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 12, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/kernels/linear/scaled_mm/ScaledMMLinearKernel.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.kernels.linear.scaled_mm.ScaledMMLinearKernel.Int8ScaledMMLinearKernel", "methods": [ { "kind": "function", "name": "Int8ScaledMMLinearKernel._get_layer_params", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.kernels.linear.scaled_mm.ScaledMMLinearKernel.FP8ScaledMMLinearKernel", "methods": [ { "kind": "function", "name": "FP8ScaledMMLinearKernel.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FP8ScaledMMLinearKernel.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FP8ScaledMMLinearKernel._get_layer_params", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FP8ScaledMMLinearKernel.apply_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "FP8ScaledMMLinearKernel.apply_scaled_mm", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "FP8ScaledMMLinearKernel.get_output_padding", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FP8ScaledMMLinearKernel.quant_fp8", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FP8ScaledMMLinearKernel.fp8_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 19, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 14, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.kernels.linear.scaled_mm.ScaledMMLinearKernel.FP8ScaledMMLinearLayerConfig", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "FP8ScaledMMLinearLayerConfig.weight_quant_key", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FP8ScaledMMLinearLayerConfig.activation_quant_key", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FP8ScaledMMLinearLayerConfig.out_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.kernels.linear.scaled_mm.ScaledMMLinearKernel.ScaledMMLinearLayerConfig", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.kernels.linear.scaled_mm.ScaledMMLinearKernel.ScaledMMLinearKernel", "methods": [ { "kind": "function", "name": "ScaledMMLinearKernel.is_supported", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ScaledMMLinearKernel.can_implement", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ScaledMMLinearKernel.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ScaledMMLinearKernel.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ScaledMMLinearKernel.apply_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ScaledMMLinearKernel._get_layer_params", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ScaledMMLinearKernel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ScaledMMLinearKernel.layer_param_names", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 14, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 9, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.kernels.linear.scaled_mm.ScaledMMLinearKernel.Int8ScaledMMLinearLayerConfig", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Int8ScaledMMLinearLayerConfig.is_static_input_scheme", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Int8ScaledMMLinearLayerConfig.is_channelwise", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Int8ScaledMMLinearLayerConfig.input_symmetric", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.kernels.linear.scaled_mm.ScaledMMLinearKernel", "names": [ "vllm.model_executor.kernels.linear.scaled_mm.ScaledMMLinearKernel.FP8ScaledMMLinearKernel", "vllm.model_executor.kernels.linear.scaled_mm.ScaledMMLinearKernel.FP8ScaledMMLinearLayerConfig", "vllm.model_executor.kernels.linear.scaled_mm.ScaledMMLinearKernel.Int8ScaledMMLinearKernel", "vllm.model_executor.kernels.linear.scaled_mm.ScaledMMLinearKernel.Int8ScaledMMLinearLayerConfig", "vllm.model_executor.kernels.linear.scaled_mm.ScaledMMLinearKernel.ScaledMMLinearKernel", "vllm.model_executor.kernels.linear.scaled_mm.ScaledMMLinearKernel.ScaledMMLinearLayerConfig" ], "n_typable": 41, "n_typed": 34, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 24, "n_classes": 6, "n_attrs": 10, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/kernels/linear/mixed_precision/machete.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.kernels.linear.mixed_precision.machete.MacheteLinearKernel", "methods": [ { "kind": "function", "name": "MacheteLinearKernel.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MacheteLinearKernel.can_implement", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MacheteLinearKernel.process_weights_after_loading", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MacheteLinearKernel.apply_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.kernels.linear.mixed_precision.machete", "names": [ "vllm.model_executor.kernels.linear.mixed_precision.machete.MacheteLinearKernel" ], "n_typable": 9, "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 5, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/kernels/linear/mixed_precision/exllama.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.kernels.linear.mixed_precision.exllama.ExllamaLinearKernel", "methods": [ { "kind": "function", "name": "ExllamaLinearKernel.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ExllamaLinearKernel.can_implement", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ExllamaLinearKernel.process_weights_after_loading", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ExllamaLinearKernel.apply_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ExllamaLinearKernel.SUPPORTED_QUANT_TYPES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 9, "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 5, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.kernels.linear.mixed_precision.exllama", "names": [ "vllm.model_executor.kernels.linear.mixed_precision.exllama.ExllamaLinearKernel" ], "n_typable": 9, "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 5, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/kernels/linear/scaled_mm/triton.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.kernels.linear.scaled_mm.triton.TritonInt8ScaledMMLinearKernel", "methods": [ { "kind": "function", "name": "TritonInt8ScaledMMLinearKernel.is_supported", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TritonInt8ScaledMMLinearKernel.can_implement", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TritonInt8ScaledMMLinearKernel.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TritonInt8ScaledMMLinearKernel.apply_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 10, "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 6, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.kernels.linear.scaled_mm.triton", "names": [ "vllm.model_executor.kernels.linear.scaled_mm.triton.TritonInt8ScaledMMLinearKernel" ], "n_typable": 10, "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 6, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/kernels/linear/scaled_mm/flashinfer.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.kernels.linear.scaled_mm.flashinfer.FlashInferFP8ScaledMMLinearKernel", "methods": [ { "kind": "function", "name": "FlashInferFP8ScaledMMLinearKernel.is_supported", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlashInferFP8ScaledMMLinearKernel.can_implement", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlashInferFP8ScaledMMLinearKernel.apply_scaled_mm", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.kernels.linear.scaled_mm.flashinfer", "names": [ "vllm.model_executor.kernels.linear.scaled_mm.flashinfer.FlashInferFP8ScaledMMLinearKernel" ], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/kernels/linear/mixed_precision/cpu.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.kernels.linear.mixed_precision.cpu.CPUWNA16LinearKernel", "methods": [ { "kind": "function", "name": "CPUWNA16LinearKernel.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CPUWNA16LinearKernel.can_implement", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CPUWNA16LinearKernel._process_gptq_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CPUWNA16LinearKernel.process_weights_after_loading", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CPUWNA16LinearKernel.apply_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 11, "n_typed": 9, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 6, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.kernels.linear.mixed_precision.cpu", "names": [ "vllm.model_executor.kernels.linear.mixed_precision.cpu.CPUWNA16LinearKernel" ], "n_typable": 11, "n_typed": 9, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 6, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/kernels/linear/scaled_mm/cutlass.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.kernels.linear.scaled_mm.cutlass.CutlassInt8ScaledMMLinearKernel", "methods": [ { "kind": "function", "name": "CutlassInt8ScaledMMLinearKernel.is_supported", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CutlassInt8ScaledMMLinearKernel.can_implement", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CutlassInt8ScaledMMLinearKernel.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CutlassInt8ScaledMMLinearKernel.apply_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 10, "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 6, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.kernels.linear.scaled_mm.cutlass.CutlassFP8ScaledMMLinearKernel", "methods": [ { "kind": "function", "name": "CutlassFP8ScaledMMLinearKernel.is_supported", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CutlassFP8ScaledMMLinearKernel.can_implement", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CutlassFP8ScaledMMLinearKernel.apply_scaled_mm", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.kernels.linear.scaled_mm.cutlass", "names": [ "vllm.model_executor.kernels.linear.scaled_mm.cutlass.CutlassFP8ScaledMMLinearKernel", "vllm.model_executor.kernels.linear.scaled_mm.cutlass.CutlassInt8ScaledMMLinearKernel" ], "n_typable": 22, "n_typed": 22, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 15, "n_classes": 2, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/kernels/linear/scaled_mm/aiter.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.kernels.linear.scaled_mm.aiter.AiterInt8ScaledMMLinearKernel", "methods": [ { "kind": "function", "name": "AiterInt8ScaledMMLinearKernel.is_supported", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AiterInt8ScaledMMLinearKernel.can_implement", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AiterInt8ScaledMMLinearKernel.apply_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 8, "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.kernels.linear.scaled_mm.aiter", "names": [ "vllm.model_executor.kernels.linear.scaled_mm.aiter.AiterInt8ScaledMMLinearKernel" ], "n_typable": 8, "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 5, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/kernels/linear/mixed_precision/conch.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.kernels.linear.mixed_precision.conch.ConchLinearKernel", "methods": [ { "kind": "function", "name": "ConchLinearKernel.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ConchLinearKernel.can_implement", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ConchLinearKernel.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ConchLinearKernel.apply_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.kernels.linear.mixed_precision.conch", "names": [ "vllm.model_executor.kernels.linear.mixed_precision.conch.ConchLinearKernel" ], "n_typable": 9, "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 5, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/kernels/linear/mixed_precision/cutlass.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.kernels.linear.mixed_precision.cutlass.CutlassW4A8LinearKernel", "methods": [ { "kind": "function", "name": "CutlassW4A8LinearKernel.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CutlassW4A8LinearKernel.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CutlassW4A8LinearKernel.can_implement", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CutlassW4A8LinearKernel.process_weights_after_loading", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CutlassW4A8LinearKernel.apply_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CutlassW4A8LinearKernel.quant_fp8", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 8, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 7, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.kernels.linear.mixed_precision.cutlass", "names": [ "vllm.model_executor.kernels.linear.mixed_precision.cutlass.CutlassW4A8LinearKernel" ], "n_typable": 13, "n_typed": 8, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 7, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/kernels/linear/mixed_precision/MPLinearKernel.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.kernels.linear.mixed_precision.MPLinearKernel.MPLinearLayerConfig", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "MPLinearLayerConfig.full_weight_shape", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MPLinearLayerConfig.partition_weight_shape", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MPLinearLayerConfig.weight_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MPLinearLayerConfig.act_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MPLinearLayerConfig.group_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MPLinearLayerConfig.zero_points", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MPLinearLayerConfig.has_g_idx", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MPLinearLayerConfig.out_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.kernels.linear.mixed_precision.MPLinearKernel.MPLinearKernel", "methods": [ { "kind": "function", "name": "MPLinearKernel.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MPLinearKernel.can_implement", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MPLinearKernel.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MPLinearKernel.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MPLinearKernel.apply_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MPLinearKernel._transform_param", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MPLinearKernel._get_weight_params", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MPLinearKernel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MPLinearKernel.w_q_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MPLinearKernel.w_s_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MPLinearKernel.w_zp_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MPLinearKernel.w_gidx_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 26, "n_typed": 21, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 14, "n_attrs": 5, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.kernels.linear.mixed_precision.MPLinearKernel", "names": [ "vllm.model_executor.kernels.linear.mixed_precision.MPLinearKernel.MPLinearKernel", "vllm.model_executor.kernels.linear.mixed_precision.MPLinearKernel.MPLinearLayerConfig" ], "n_typable": 26, "n_typed": 21, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 14, "n_classes": 2, "n_attrs": 13, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/kernels/linear/mixed_precision/allspark.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.kernels.linear.mixed_precision.allspark.AllSparkLinearKernel", "methods": [ { "kind": "function", "name": "AllSparkLinearKernel.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AllSparkLinearKernel.can_implement", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AllSparkLinearKernel.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AllSparkLinearKernel.apply_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.kernels.linear.mixed_precision.allspark", "names": [ "vllm.model_executor.kernels.linear.mixed_precision.allspark.AllSparkLinearKernel" ], "n_typable": 9, "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 5, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/kernels/linear/scaled_mm/cpu.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.kernels.linear.scaled_mm.cpu.CPUInt8ScaledMMLinearKernel", "methods": [ { "kind": "function", "name": "CPUInt8ScaledMMLinearKernel.is_supported", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CPUInt8ScaledMMLinearKernel.can_implement", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CPUInt8ScaledMMLinearKernel.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CPUInt8ScaledMMLinearKernel.process_weights_for_onednn", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CPUInt8ScaledMMLinearKernel.process_weights_for_sgl", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CPUInt8ScaledMMLinearKernel.apply_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "CPUInt8ScaledMMLinearKernel._apply_weights_onednn", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "CPUInt8ScaledMMLinearKernel._apply_weights_sgl", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 22, "n_typed": 22, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 14, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.kernels.linear.scaled_mm.cpu", "names": [ "vllm.model_executor.kernels.linear.scaled_mm.cpu.CPUInt8ScaledMMLinearKernel" ], "n_typable": 22, "n_typed": 22, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 14, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/kernels/linear/mixed_precision/xpu.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.kernels.linear.mixed_precision.xpu.XPUwNa16LinearKernel", "methods": [ { "kind": "function", "name": "XPUwNa16LinearKernel.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "XPUwNa16LinearKernel.can_implement", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "XPUwNa16LinearKernel.process_weights_after_loading", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "XPUwNa16LinearKernel.apply_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.kernels.linear.mixed_precision.xpu", "names": [ "vllm.model_executor.kernels.linear.mixed_precision.xpu.XPUwNa16LinearKernel" ], "n_typable": 9, "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 5, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/kernels/linear/scaled_mm/xpu.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.kernels.linear.scaled_mm.xpu.XPUFP8ScaledMMLinearKernel", "methods": [ { "kind": "function", "name": "XPUFP8ScaledMMLinearKernel.is_supported", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "XPUFP8ScaledMMLinearKernel.can_implement", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "XPUFP8ScaledMMLinearKernel.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "XPUFP8ScaledMMLinearKernel.apply_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "XPUFP8ScaledMMLinearKernel.apply_scaled_mm", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "XPUFP8ScaledMMLinearKernel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "XPUFP8ScaledMMLinearKernel.layer_param_names", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 19, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 14, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.kernels.linear.scaled_mm.xpu", "names": [ "vllm.model_executor.kernels.linear.scaled_mm.xpu.XPUFP8ScaledMMLinearKernel" ], "n_typable": 21, "n_typed": 19, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 14, "n_classes": 1, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/activation.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.layers.activation.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.activation.SiluAndMul", "methods": [ { "kind": "function", "name": "SiluAndMul.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SiluAndMul.forward_native", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SiluAndMul.forward_cuda", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SiluAndMul.forward_xpu", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SiluAndMul.op", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 7, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 4, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.activation.swiglustep_and_mul_triton", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.model_executor.layers.activation.SwigluOAIAndMul", "methods": [ { "kind": "function", "name": "SwigluOAIAndMul.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SwigluOAIAndMul.forward_native", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SwigluOAIAndMul.forward_cuda", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SwigluOAIAndMul.extra_repr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SwigluOAIAndMul.alpha", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SwigluOAIAndMul.limit", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 7, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 4, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.activation.QuickGELU", "methods": [ { "kind": "function", "name": "QuickGELU.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "QuickGELU.forward_native", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "QuickGELU.forward_cuda", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "QuickGELU.forward_xpu", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "QuickGELU.op", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 3, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.activation.FastGELU", "methods": [ { "kind": "function", "name": "FastGELU.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FastGELU.forward_native", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FastGELU.forward_cuda", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FastGELU.forward_xpu", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FastGELU.op", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 3, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.activation.GeluAndMul", "methods": [ { "kind": "function", "name": "GeluAndMul.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GeluAndMul.forward_native", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GeluAndMul.forward_cuda", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GeluAndMul.forward_xpu", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GeluAndMul.extra_repr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GeluAndMul.approximate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GeluAndMul.op", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 8, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 4, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.activation.SwigluStepAndMul", "methods": [ { "kind": "function", "name": "SwigluStepAndMul.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SwigluStepAndMul.forward_native", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SwigluStepAndMul.forward_cuda", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SwigluStepAndMul.extra_repr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SwigluStepAndMul.limit", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 3, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.activation.ScaledActivation", "methods": [ { "kind": "function", "name": "ScaledActivation.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ScaledActivation.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ScaledActivation.weight_loader", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ScaledActivation.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ScaledActivation.input_is_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ScaledActivation.scales", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 8, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 3, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.activation.get_act_and_mul_fn", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.activation.MulAndSilu", "methods": [ { "kind": "function", "name": "MulAndSilu.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MulAndSilu.forward_native", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MulAndSilu.forward_cuda", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MulAndSilu.forward_xpu", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MulAndSilu.op", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 3, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.activation.NewGELU", "methods": [ { "kind": "function", "name": "NewGELU.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NewGELU.forward_native", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NewGELU.forward_cuda", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NewGELU.forward_xpu", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "NewGELU.op", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 3, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.activation.GeluAndMulSparse", "methods": [ { "kind": "function", "name": "GeluAndMulSparse.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GeluAndMulSparse._gaussian_topk", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GeluAndMulSparse.forward_native", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GeluAndMulSparse.forward_cuda", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GeluAndMulSparse.approximate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GeluAndMulSparse.std_multiplier", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 8, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 5, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.activation.ReLUSquaredActivation", "methods": [ { "kind": "function", "name": "ReLUSquaredActivation.forward_native", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ReLUSquaredActivation.forward_cuda", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.activation.FatreluAndMul", "methods": [ { "kind": "function", "name": "FatreluAndMul.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FatreluAndMul.forward_native", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FatreluAndMul.forward_cuda", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FatreluAndMul.threshold", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FatreluAndMul.op", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 5, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.activation.XIELU", "methods": [ { "kind": "function", "name": "XIELU.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "XIELU._xielu_python", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "XIELU._xielu_cuda", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "XIELU.forward_native", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "XIELU.forward_cuda", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "XIELU.alpha_p", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "XIELU.alpha_n", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "XIELU.with_vector_loads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 14, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 10, "n_attrs": 3, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.activation.get_act_fn", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.activation", "names": [ "vllm.model_executor.layers.activation.FastGELU", "vllm.model_executor.layers.activation.FatreluAndMul", "vllm.model_executor.layers.activation.GeluAndMul", "vllm.model_executor.layers.activation.GeluAndMulSparse", "vllm.model_executor.layers.activation.MulAndSilu", "vllm.model_executor.layers.activation.NewGELU", "vllm.model_executor.layers.activation.QuickGELU", "vllm.model_executor.layers.activation.ReLUSquaredActivation", "vllm.model_executor.layers.activation.ScaledActivation", "vllm.model_executor.layers.activation.SiluAndMul", "vllm.model_executor.layers.activation.SwigluOAIAndMul", "vllm.model_executor.layers.activation.SwigluStepAndMul", "vllm.model_executor.layers.activation.XIELU", "vllm.model_executor.layers.activation.get_act_and_mul_fn", "vllm.model_executor.layers.activation.get_act_fn", "vllm.model_executor.layers.activation.logger", "vllm.model_executor.layers.activation.swiglustep_and_mul_triton" ], "n_typable": 133, "n_typed": 98, "n_any": 0, "n_untyped": 35, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 5, "n_methods": 50, "n_method_overloads": 50, "n_method_params": 54, "n_classes": 13, "n_attrs": 21, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/attention/mm_encoder_attention.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.attention.mm_encoder_attention.MMEncoderAttention", "methods": [ { "kind": "function", "name": "MMEncoderAttention.compute_max_seqlen", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MMEncoderAttention.maybe_compute_sequence_lengths", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MMEncoderAttention.maybe_recompute_cu_seqlens", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MMEncoderAttention.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MMEncoderAttention.enabled", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MMEncoderAttention.view_qkv_to_4d", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "MMEncoderAttention._forward_sdpa", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MMEncoderAttention._forward_fa", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MMEncoderAttention._forward_triton", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MMEncoderAttention._forward_flashinfer", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "MMEncoderAttention.forward_native", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "MMEncoderAttention.forward_cuda", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "MMEncoderAttention.forward_cpu", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "MMEncoderAttention.forward_xpu", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MMEncoderAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MMEncoderAttention.head_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MMEncoderAttention.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MMEncoderAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MMEncoderAttention.layer_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MMEncoderAttention.num_queries_per_kv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MMEncoderAttention.attn_backend", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MMEncoderAttention.is_flash_attn_backend", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 85, "n_typed": 77, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 63, "n_attrs": 8, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.attention.mm_encoder_attention.FLASHINFER_BATCH_BUCKETS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.attention.mm_encoder_attention.add_padding_to_seqlens", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.attention.mm_encoder_attention.bucket_flashinfer_max_seqlen", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.attention.mm_encoder_attention.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.attention.mm_encoder_attention.FLASHINFER_CUDNN_WORKSPACE_SIZE_BYTES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.attention.mm_encoder_attention.FLASHINFER_MAX_SEQLEN_BUCKETS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.attention.mm_encoder_attention", "names": [ "vllm.model_executor.layers.attention.mm_encoder_attention.FLASHINFER_BATCH_BUCKETS", "vllm.model_executor.layers.attention.mm_encoder_attention.FLASHINFER_CUDNN_WORKSPACE_SIZE_BYTES", "vllm.model_executor.layers.attention.mm_encoder_attention.FLASHINFER_MAX_SEQLEN_BUCKETS", "vllm.model_executor.layers.attention.mm_encoder_attention.MMEncoderAttention", "vllm.model_executor.layers.attention.mm_encoder_attention.add_padding_to_seqlens", "vllm.model_executor.layers.attention.mm_encoder_attention.bucket_flashinfer_max_seqlen", "vllm.model_executor.layers.attention.mm_encoder_attention.logger" ], "n_typable": 92, "n_typed": 83, "n_any": 0, "n_untyped": 9, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 4, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 63, "n_classes": 1, "n_attrs": 12, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/attention/attention.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.attention.attention.Attention", "methods": [ { "kind": "function", "name": "Attention.__init__", "n_typed": 16, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 17, "n_params": 16, "n_function_overloads": 1, "n_function_params": 16 }, { "kind": "function", "name": "Attention.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Attention.calc_kv_scales", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Attention.extra_repr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Attention.process_weights_after_loading", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Attention.get_attn_backend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Attention.get_kv_cache_spec", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Attention.kv_cache_torch_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Attention.kv_cache_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Attention.calculate_kv_scales", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Attention.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Attention.layer_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Attention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Attention.head_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Attention.head_size_v", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Attention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Attention.sliding_window", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Attention.has_sink", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Attention.use_mm_prefix", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Attention.use_alibi_sqrt", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Attention.impl", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Attention.backend", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Attention.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Attention.use_direct_call", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Attention.use_output", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Attention.attn_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Attention.kv_sharing_target_layer_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Attention.kv_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Attention.query_quant", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Attention.attn_backend", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 55, "n_typed": 26, "n_any": 0, "n_untyped": 29, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 25, "n_attrs": 23, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.attention.attention.get_attention_context", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.attention.attention.unified_attention_fake", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.layers.attention.attention.maybe_calc_kv_scales", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.layers.attention.attention.validate_kv_sharing_target", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.attention.attention.maybe_calc_kv_scales_fake", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.layers.attention.attention.set_default_quant_scales", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.attention.attention.unified_kv_cache_update", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.attention.attention.unified_attention", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.layers.attention.attention.unified_attention_with_output", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "vllm.model_executor.layers.attention.attention.unified_kv_cache_update_fake", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.attention.attention.should_load_quant_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.attention.attention.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.attention.attention.unified_attention_with_output_fake", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 } ], "type_ignores": [], "name": "vllm.model_executor.layers.attention.attention", "names": [ "vllm.model_executor.layers.attention.attention.Attention", "vllm.model_executor.layers.attention.attention.get_attention_context", "vllm.model_executor.layers.attention.attention.logger", "vllm.model_executor.layers.attention.attention.maybe_calc_kv_scales", "vllm.model_executor.layers.attention.attention.maybe_calc_kv_scales_fake", "vllm.model_executor.layers.attention.attention.set_default_quant_scales", "vllm.model_executor.layers.attention.attention.should_load_quant_weights", "vllm.model_executor.layers.attention.attention.unified_attention", "vllm.model_executor.layers.attention.attention.unified_attention_fake", "vllm.model_executor.layers.attention.attention.unified_attention_with_output", "vllm.model_executor.layers.attention.attention.unified_attention_with_output_fake", "vllm.model_executor.layers.attention.attention.unified_kv_cache_update", "vllm.model_executor.layers.attention.attention.unified_kv_cache_update_fake", "vllm.model_executor.layers.attention.attention.validate_kv_sharing_target" ], "n_typable": 113, "n_typed": 79, "n_any": 0, "n_untyped": 34, "n_functions": 12, "n_function_overloads": 12, "n_function_params": 45, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 25, "n_classes": 1, "n_attrs": 24, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/attention/encoder_only_attention.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.attention.encoder_only_attention.EncoderOnlyAttention", "methods": [ { "kind": "function", "name": "EncoderOnlyAttention.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "EncoderOnlyAttention.get_kv_cache_spec", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 7, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.attention.encoder_only_attention.create_encoder_only_attention_backend", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.attention.encoder_only_attention", "names": [ "vllm.model_executor.layers.attention.encoder_only_attention.EncoderOnlyAttention", "vllm.model_executor.layers.attention.encoder_only_attention.create_encoder_only_attention_backend" ], "n_typable": 11, "n_typed": 9, "n_any": 0, "n_untyped": 2, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/attention/chunked_local_attention.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.attention.chunked_local_attention.ChunkedLocalAttention", "methods": [ { "kind": "function", "name": "ChunkedLocalAttention.__init__", "n_typed": 10, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "ChunkedLocalAttention.get_kv_cache_spec", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ChunkedLocalAttention.attention_chunk_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 12, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 11, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.attention.chunked_local_attention.create_chunked_local_attention_backend", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [], "name": "vllm.model_executor.layers.attention.chunked_local_attention", "names": [ "vllm.model_executor.layers.attention.chunked_local_attention.ChunkedLocalAttention", "vllm.model_executor.layers.attention.chunked_local_attention.create_chunked_local_attention_backend" ], "n_typable": 18, "n_typed": 16, "n_any": 0, "n_untyped": 2, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 3, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 11, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/attention/cross_attention.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.attention.cross_attention.CrossAttention", "methods": [ { "kind": "function", "name": "CrossAttention.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "CrossAttention.get_kv_cache_spec", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 7, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.attention.cross_attention.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.attention.cross_attention.create_cross_attention_backend", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.attention.cross_attention", "names": [ "vllm.model_executor.layers.attention.cross_attention.CrossAttention", "vllm.model_executor.layers.attention.cross_attention.create_cross_attention_backend", "vllm.model_executor.layers.attention.cross_attention.logger" ], "n_typable": 12, "n_typed": 9, "n_any": 0, "n_untyped": 3, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/attention/mla_attention.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.attention.mla_attention.MLAAttention", "methods": [ { "kind": "function", "name": "MLAAttention.__init__", "n_typed": 13, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 15, "n_params": 14, "n_function_overloads": 1, "n_function_params": 14 }, { "kind": "function", "name": "MLAAttention.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MLAAttention.forward_impl", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "MLAAttention.process_weights_after_loading", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MLAAttention.calc_kv_scales", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MLAAttention.get_attn_backend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MLAAttention.get_kv_cache_spec", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MLAAttention._v_up_proj", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MLAAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLAAttention.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLAAttention.qk_nope_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLAAttention.qk_rope_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLAAttention.v_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLAAttention.q_lora_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLAAttention.kv_lora_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLAAttention.kv_b_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLAAttention.head_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLAAttention.layer_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLAAttention.indexer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLAAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLAAttention.qk_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLAAttention.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLAAttention.kv_cache_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLAAttention.calculate_kv_scales", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLAAttention.attn_backend", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLAAttention.impl", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLAAttention.q_pad_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLAAttention.use_direct_call", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLAAttention.kv_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLAAttention.use_sparse", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLAAttention.q_range", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLAAttention.k_range", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLAAttention.v_range", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLAAttention.is_aiter_triton_fp8_bmm_enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLAAttention.is_aiter_triton_fp4_bmm_enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLAAttention.chunked_prefill_workspace_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 69, "n_typed": 37, "n_any": 0, "n_untyped": 32, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 33, "n_attrs": 28, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.attention.mla_attention.FlashInferPrefillMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashInferPrefillMetadata.prefill_main", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashInferPrefillMetadata.prefill_chunks", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.attention.mla_attention.flash_attn_varlen_func", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.attention.mla_attention.is_vllm_fa", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.attention.mla_attention.CUDNN_WORKSPACE_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.attention.mla_attention.use_cudnn_prefill", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.attention.mla_attention.QueryLenSupport", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "QueryLenSupport.SINGLE_ONLY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "QueryLenSupport.UNIFORM", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "QueryLenSupport.VARLEN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.attention.mla_attention.MLADims", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "MLADims.q_lora_rank", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MLADims.kv_lora_rank", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MLADims.qk_nope_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MLADims.qk_rope_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MLADims.v_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 5, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.attention.mla_attention.D", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.attention.mla_attention.MLACommonImpl", "methods": [ { "kind": "function", "name": "MLACommonImpl.__init__", "n_typed": 20, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 20, "n_params": 19, "n_function_overloads": 1, "n_function_params": 19 }, { "kind": "function", "name": "MLACommonImpl._flash_attn_varlen_diff_headdims", "n_typed": 0, "n_any": 0, "n_untyped": 7, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "MLACommonImpl._run_prefill_new_tokens_fa", "n_typed": 1, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MLACommonImpl._run_prefill_new_tokens_fi", "n_typed": 1, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MLACommonImpl._run_prefill_new_tokens_cudnn", "n_typed": 1, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MLACommonImpl._run_prefill_context_chunk_fa", "n_typed": 2, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MLACommonImpl._run_prefill_context_chunk_fi", "n_typed": 2, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MLACommonImpl._run_prefill_context_chunk_cudnn", "n_typed": 2, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MLACommonImpl._run_prefill_new_tokens_trtllm_ragged", "n_typed": 1, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MLACommonImpl._run_prefill_context_chunk_trtllm_ragged", "n_typed": 2, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MLACommonImpl._concat_k_nope_k_pe", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MLACommonImpl._compute_prefill_context", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MLACommonImpl._context_parallel_compute_prefill_context", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MLACommonImpl.forward_mha", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "MLACommonImpl.forward_mqa", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MLACommonImpl.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLACommonImpl.head_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLACommonImpl.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLACommonImpl.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLACommonImpl.kv_cache_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLACommonImpl.q_lora_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLACommonImpl.kv_lora_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLACommonImpl.qk_nope_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLACommonImpl.qk_rope_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLACommonImpl.qk_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLACommonImpl.v_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLACommonImpl.kv_b_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLACommonImpl.indexer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLACommonImpl.q_pad_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLACommonImpl.supports_quant_query_input", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLACommonImpl.dcp_world_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MLACommonImpl.cp_kv_cache_interleave_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MLACommonImpl.flash_attn_varlen_func", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLACommonImpl.vllm_flash_attn_version", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 121, "n_typed": 59, "n_any": 0, "n_untyped": 62, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 87, "n_attrs": 19, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.attention.mla_attention.use_flashinfer_prefill", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.attention.mla_attention.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.attention.mla_attention.unified_mla_attention_with_output", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "vllm.model_executor.layers.attention.mla_attention.is_deepseek_r1_mla_compatible", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.attention.mla_attention.unified_mla_attention_fake", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.model_executor.layers.attention.mla_attention.unified_mla_kv_cache_update", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "class", "name": "vllm.model_executor.layers.attention.mla_attention.MLACommonMetadata", "methods": [ { "kind": "function", "name": "MLACommonMetadata.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MLACommonMetadata.num_reqs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MLACommonMetadata.max_query_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MLACommonMetadata.max_seq_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MLACommonMetadata.num_actual_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MLACommonMetadata.query_start_loc", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MLACommonMetadata.slot_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MLACommonMetadata.num_decodes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MLACommonMetadata.num_decode_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MLACommonMetadata.num_prefills", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MLACommonMetadata.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MLACommonMetadata.decode", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MLACommonMetadata.prefill", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 12, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.attention.mla_attention.unified_mla_attention_with_output_fake", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "vllm.model_executor.layers.attention.mla_attention.unified_mla_kv_cache_update_fake", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.model_executor.layers.attention.mla_attention.get_mla_dims", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.attention.mla_attention.backend_supports_prefill_query_quantization", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.attention.mla_attention.MLACommonBackend", "methods": [ { "kind": "function", "name": "MLACommonBackend.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MLACommonBackend.get_builder_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MLACommonBackend.get_kv_cache_shape", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MLACommonBackend.get_kv_cache_stride_order", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MLACommonBackend.get_supported_head_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MLACommonBackend.is_mla", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MLACommonBackend.accept_output_buffer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 13, "n_typed": 13, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 6, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.attention.mla_attention.M", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.attention.mla_attention.MLACommonDecodeMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "MLACommonDecodeMetadata.block_table", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MLACommonDecodeMetadata.seq_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MLACommonDecodeMetadata.dcp_tot_seq_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.attention.mla_attention.MLACommonMetadataBuilder", "methods": [ { "kind": "function", "name": "MLACommonMetadataBuilder.determine_chunked_prefill_workspace_size", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MLACommonMetadataBuilder.determine_prefill_query_data_type", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MLACommonMetadataBuilder.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "MLACommonMetadataBuilder._build_fi_prefill_wrappers", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MLACommonMetadataBuilder._build_decode", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "MLACommonMetadataBuilder.build_for_cudagraph_capture", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MLACommonMetadataBuilder.build", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MLACommonMetadataBuilder.query_len_support", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MLACommonMetadataBuilder.reorder_batch_threshold", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MLACommonMetadataBuilder.metadata_cls", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLACommonMetadataBuilder.kv_cache_spec", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLACommonMetadataBuilder.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLACommonMetadataBuilder.compilation_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLACommonMetadataBuilder.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLACommonMetadataBuilder.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLACommonMetadataBuilder.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLACommonMetadataBuilder.mla_dims", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLACommonMetadataBuilder.aot_schedule", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLACommonMetadataBuilder.q_data_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLACommonMetadataBuilder.dcp_local_block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLACommonMetadataBuilder.dcp_virtual_block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLACommonMetadataBuilder.cp_kv_cache_interleave_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLACommonMetadataBuilder.chunked_prefill_workspace_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLACommonMetadataBuilder.prefill_metadata_cls", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLACommonMetadataBuilder.dcp_world_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLACommonMetadataBuilder.dcp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLACommonMetadataBuilder.page_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLACommonMetadataBuilder.chunked_prefill_workspace", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLACommonMetadataBuilder.cudnn_workspace", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 50, "n_typed": 28, "n_any": 0, "n_untyped": 22, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 21, "n_attrs": 22, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.attention.mla_attention.use_trtllm_ragged_deepseek_prefill", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.attention.mla_attention.MLACommonPrefillMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "MLACommonPrefillMetadata.block_table", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MLACommonPrefillMetadata.query_start_loc", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MLACommonPrefillMetadata.max_query_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MLACommonPrefillMetadata.chunked_context", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MLACommonPrefillMetadata.query_seq_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MLACommonPrefillMetadata.workspace_buffer", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MLACommonPrefillMetadata.q_data_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MLACommonPrefillMetadata.output_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 8, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.attention.mla_attention.A", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.attention.mla_attention.dynamic_per_batched_tensor_quant", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.layers.attention.mla_attention.CudnnPrefillMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "CudnnPrefillMetadata.cudnn_workspace", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.attention.mla_attention.unified_mla_attention", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "class", "name": "vllm.model_executor.layers.attention.mla_attention.ChunkedContextMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ChunkedContextMetadata.cu_seq_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ChunkedContextMetadata.starts", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ChunkedContextMetadata.seq_tot", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ChunkedContextMetadata.max_seq_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ChunkedContextMetadata.seq_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ChunkedContextMetadata.workspace", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ChunkedContextMetadata.token_to_seq", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ChunkedContextMetadata.chunk_total_token", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ChunkedContextMetadata.padded_local_chunk_seq_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ChunkedContextMetadata.local_context_lens_allranks", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ChunkedContextMetadata.padded_local_cu_seq_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ChunkedContextMetadata.cu_seq_lens_lst", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ChunkedContextMetadata.chunk_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 13, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.attention.mla_attention.reorg_kvcache", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 } ], "type_ignores": [ { "kind": "type", "rules": [ "assignment" ] }, { "kind": "type", "rules": [ "no-redef" ] }, { "kind": "type", "rules": [ "arg-type" ] }, { "kind": "type", "rules": [ "arg-type" ] }, { "kind": "type", "rules": [ "arg-type" ] } ], "name": "vllm.model_executor.layers.attention.mla_attention", "names": [ "vllm.model_executor.layers.attention.mla_attention.A", "vllm.model_executor.layers.attention.mla_attention.CUDNN_WORKSPACE_SIZE", "vllm.model_executor.layers.attention.mla_attention.ChunkedContextMetadata", "vllm.model_executor.layers.attention.mla_attention.CudnnPrefillMetadata", "vllm.model_executor.layers.attention.mla_attention.D", "vllm.model_executor.layers.attention.mla_attention.FlashInferPrefillMetadata", "vllm.model_executor.layers.attention.mla_attention.M", "vllm.model_executor.layers.attention.mla_attention.MLAAttention", "vllm.model_executor.layers.attention.mla_attention.MLACommonBackend", "vllm.model_executor.layers.attention.mla_attention.MLACommonDecodeMetadata", "vllm.model_executor.layers.attention.mla_attention.MLACommonImpl", "vllm.model_executor.layers.attention.mla_attention.MLACommonMetadata", "vllm.model_executor.layers.attention.mla_attention.MLACommonMetadataBuilder", "vllm.model_executor.layers.attention.mla_attention.MLACommonPrefillMetadata", "vllm.model_executor.layers.attention.mla_attention.MLADims", "vllm.model_executor.layers.attention.mla_attention.QueryLenSupport", "vllm.model_executor.layers.attention.mla_attention.backend_supports_prefill_query_quantization", "vllm.model_executor.layers.attention.mla_attention.dynamic_per_batched_tensor_quant", "vllm.model_executor.layers.attention.mla_attention.flash_attn_varlen_func", "vllm.model_executor.layers.attention.mla_attention.get_mla_dims", "vllm.model_executor.layers.attention.mla_attention.is_deepseek_r1_mla_compatible", "vllm.model_executor.layers.attention.mla_attention.is_vllm_fa", "vllm.model_executor.layers.attention.mla_attention.logger", "vllm.model_executor.layers.attention.mla_attention.reorg_kvcache", "vllm.model_executor.layers.attention.mla_attention.unified_mla_attention", "vllm.model_executor.layers.attention.mla_attention.unified_mla_attention_fake", "vllm.model_executor.layers.attention.mla_attention.unified_mla_attention_with_output", "vllm.model_executor.layers.attention.mla_attention.unified_mla_attention_with_output_fake", "vllm.model_executor.layers.attention.mla_attention.unified_mla_kv_cache_update", "vllm.model_executor.layers.attention.mla_attention.unified_mla_kv_cache_update_fake", "vllm.model_executor.layers.attention.mla_attention.use_cudnn_prefill", "vllm.model_executor.layers.attention.mla_attention.use_flashinfer_prefill", "vllm.model_executor.layers.attention.mla_attention.use_trtllm_ragged_deepseek_prefill" ], "n_typable": 318, "n_typed": 199, "n_any": 0, "n_untyped": 119, "n_functions": 14, "n_function_overloads": 14, "n_function_params": 49, "n_methods": 37, "n_method_overloads": 37, "n_method_params": 147, "n_classes": 12, "n_attrs": 124, "n_properties": 0, "n_type_ignores": 5 }, { "path": "vllm/model_executor/layers/attention/static_sink_attention.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.attention.static_sink_attention.StaticSinkAttention", "methods": [ { "kind": "function", "name": "StaticSinkAttention.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "StaticSinkAttention.update_sink_kv", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StaticSinkAttention.forward_native", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "StaticSinkAttention.forward_cuda", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "StaticSinkAttention.forward", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StaticSinkAttention.populate_sink_kv", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StaticSinkAttention.get_kv_cache_spec", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "StaticSinkAttention.sink_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StaticSinkAttention.block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StaticSinkAttention.sink_populated", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StaticSinkAttention.sink_key", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StaticSinkAttention.sink_value", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 33, "n_typed": 19, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 21, "n_attrs": 5, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.attention.static_sink_attention.maybe_populate_sink_fake", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.attention.static_sink_attention.maybe_populate_sink", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.attention.static_sink_attention.create_static_sink_attention_backend", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.model_executor.layers.attention.static_sink_attention.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.attention.static_sink_attention", "names": [ "vllm.model_executor.layers.attention.static_sink_attention.StaticSinkAttention", "vllm.model_executor.layers.attention.static_sink_attention.create_static_sink_attention_backend", "vllm.model_executor.layers.attention.static_sink_attention.logger", "vllm.model_executor.layers.attention.static_sink_attention.maybe_populate_sink", "vllm.model_executor.layers.attention.static_sink_attention.maybe_populate_sink_fake" ], "n_typable": 43, "n_typed": 28, "n_any": 0, "n_untyped": 15, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 6, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 21, "n_classes": 1, "n_attrs": 6, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/attention/kv_transfer_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.attention.kv_transfer_utils.maybe_transfer_kv_layer", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.attention.kv_transfer_utils", "names": [ "vllm.model_executor.layers.attention.kv_transfer_utils.maybe_transfer_kv_layer" ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/attention_layer_base.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.attention_layer_base.AttentionLayerBase", "methods": [ { "kind": "function", "name": "AttentionLayerBase.get_attn_backend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AttentionLayerBase.get_kv_cache_spec", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AttentionLayerBase.impl", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.attention_layer_base", "names": [ "vllm.model_executor.layers.attention_layer_base.AttentionLayerBase" ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/batch_invariant.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.batch_invariant.mm_batch_invariant", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.batch_invariant.mean_kernel", "n_typed": 1, "n_any": 0, "n_untyped": 11, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "vllm.model_executor.layers.batch_invariant.rms_norm_batch_invariant", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.batch_invariant.vllm_is_batch_invariant", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.batch_invariant.matmul_kernel_persistent", "n_typed": 9, "n_any": 0, "n_untyped": 14, "n_overloads": 1, "n_typable": 23, "n_params": 22, "n_function_overloads": 1, "n_function_params": 22 }, { "kind": "function", "name": "vllm.model_executor.layers.batch_invariant.bmm_batch_invariant", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.batch_invariant.log_softmax", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.batch_invariant.mean_batch_invariant", "n_typed": 1, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.layers.batch_invariant.init_batch_invariance", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.batch_invariant.VLLM_BATCH_INVARIANT", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.batch_invariant.matmul_persistent", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.batch_invariant.linear_batch_invariant", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.batch_invariant.addmm_batch_invariant", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.batch_invariant.softmax_batch_invariant", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.batch_invariant.override_envs_for_invariance", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.batch_invariant.matmul_batch_invariant", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.batch_invariant.mean_dim", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.layers.batch_invariant.enable_batch_invariant_mode", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.batch_invariant.rms_norm", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.model_executor.layers.batch_invariant.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.batch_invariant.bmm_kernel", "n_typed": 6, "n_any": 0, "n_untyped": 17, "n_overloads": 1, "n_typable": 23, "n_params": 22, "n_function_overloads": 1, "n_function_params": 22 } ], "type_ignores": [], "name": "vllm.model_executor.layers.batch_invariant", "names": [ "vllm.model_executor.layers.batch_invariant.VLLM_BATCH_INVARIANT", "vllm.model_executor.layers.batch_invariant.addmm_batch_invariant", "vllm.model_executor.layers.batch_invariant.bmm_batch_invariant", "vllm.model_executor.layers.batch_invariant.bmm_kernel", "vllm.model_executor.layers.batch_invariant.enable_batch_invariant_mode", "vllm.model_executor.layers.batch_invariant.init_batch_invariance", "vllm.model_executor.layers.batch_invariant.linear_batch_invariant", "vllm.model_executor.layers.batch_invariant.log_softmax", "vllm.model_executor.layers.batch_invariant.logger", "vllm.model_executor.layers.batch_invariant.matmul_batch_invariant", "vllm.model_executor.layers.batch_invariant.matmul_kernel_persistent", "vllm.model_executor.layers.batch_invariant.matmul_persistent", "vllm.model_executor.layers.batch_invariant.mean_batch_invariant", "vllm.model_executor.layers.batch_invariant.mean_dim", "vllm.model_executor.layers.batch_invariant.mean_kernel", "vllm.model_executor.layers.batch_invariant.mm_batch_invariant", "vllm.model_executor.layers.batch_invariant.override_envs_for_invariance", "vllm.model_executor.layers.batch_invariant.rms_norm", "vllm.model_executor.layers.batch_invariant.rms_norm_batch_invariant", "vllm.model_executor.layers.batch_invariant.softmax_batch_invariant", "vllm.model_executor.layers.batch_invariant.vllm_is_batch_invariant" ], "n_typable": 114, "n_typed": 40, "n_any": 0, "n_untyped": 74, "n_functions": 19, "n_function_overloads": 19, "n_function_params": 93, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/conv.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.conv.ConvLayerBase", "methods": [ { "kind": "function", "name": "ConvLayerBase.__init__", "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "ConvLayerBase.extra_repr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ConvLayerBase.num_dim", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ConvLayerBase.in_channels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConvLayerBase.out_channels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConvLayerBase.kernel_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConvLayerBase.stride", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConvLayerBase.padding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConvLayerBase.dilation", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConvLayerBase.groups", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConvLayerBase.padding_mode", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConvLayerBase.enable_linear", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConvLayerBase.input_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConvLayerBase.weight", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConvLayerBase.bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 25, "n_typed": 13, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 10, "n_attrs": 13, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.conv.CausalConv2dLayer", "methods": [ { "kind": "function", "name": "CausalConv2dLayer.__init__", "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "CausalConv2dLayer.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 13, "n_typed": 13, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 11, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.conv.Conv3dLayer", "methods": [ { "kind": "function", "name": "Conv3dLayer._forward_mulmat", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Conv3dLayer._forward_conv", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Conv3dLayer.forward_native", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Conv3dLayer.forward_cuda", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Conv3dLayer.num_dim", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 8, "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 4, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.conv.Conv2dLayer", "methods": [ { "kind": "function", "name": "Conv2dLayer._forward_mulmat", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Conv2dLayer._forward_conv", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Conv2dLayer.forward_native", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Conv2dLayer.forward_cuda", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Conv2dLayer.num_dim", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 8, "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 4, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.conv", "names": [ "vllm.model_executor.layers.conv.CausalConv2dLayer", "vllm.model_executor.layers.conv.Conv2dLayer", "vllm.model_executor.layers.conv.Conv3dLayer", "vllm.model_executor.layers.conv.ConvLayerBase" ], "n_typable": 54, "n_typed": 42, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 29, "n_classes": 4, "n_attrs": 15, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fla/ops/chunk.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.chunk.chunk_gated_delta_rule", "n_typed": 10, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.chunk.chunk_gated_delta_rule_fwd", "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "class", "name": "vllm.model_executor.layers.fla.ops.chunk.ChunkGatedDeltaRuleFunction", "methods": [ { "kind": "function", "name": "ChunkGatedDeltaRuleFunction.forward", "n_typed": 10, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 10, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 11, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fla.ops.chunk", "names": [ "vllm.model_executor.layers.fla.ops.chunk.ChunkGatedDeltaRuleFunction", "vllm.model_executor.layers.fla.ops.chunk.chunk_gated_delta_rule", "vllm.model_executor.layers.fla.ops.chunk.chunk_gated_delta_rule_fwd" ], "n_typable": 33, "n_typed": 29, "n_any": 0, "n_untyped": 4, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 19, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 11, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fla/ops/fused_recurrent.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.fused_recurrent.fused_recurrent_gated_delta_rule", "n_typed": 13, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.fused_recurrent.fused_recurrent_gated_delta_rule_fwd", "n_typed": 13, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.fused_recurrent.fused_recurrent_gated_delta_rule_fwd_kernel", "n_typed": 21, "n_any": 0, "n_untyped": 13, "n_overloads": 1, "n_typable": 34, "n_params": 33, "n_function_overloads": 1, "n_function_params": 33 }, { "kind": "class", "name": "vllm.model_executor.layers.fla.ops.fused_recurrent.FusedRecurrentFunction", "methods": [ { "kind": "function", "name": "FusedRecurrentFunction.forward", "n_typed": 12, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 } ], "properties": [], "attrs": [], "n_typable": 14, "n_typed": 12, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 13, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fla.ops.fused_recurrent", "names": [ "vllm.model_executor.layers.fla.ops.fused_recurrent.FusedRecurrentFunction", "vllm.model_executor.layers.fla.ops.fused_recurrent.fused_recurrent_gated_delta_rule", "vllm.model_executor.layers.fla.ops.fused_recurrent.fused_recurrent_gated_delta_rule_fwd", "vllm.model_executor.layers.fla.ops.fused_recurrent.fused_recurrent_gated_delta_rule_fwd_kernel" ], "n_typable": 74, "n_typed": 59, "n_any": 0, "n_untyped": 15, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 57, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 13, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fla/ops/layernorm_guard.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.fla.ops.layernorm_guard.RMSNormGated", "methods": [ { "kind": "function", "name": "RMSNormGated.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "RMSNormGated.reset_parameters", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RMSNormGated.forward", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RMSNormGated.eps", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RMSNormGated.activation", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RMSNormGated.weight", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RMSNormGated.group_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RMSNormGated.norm_before_gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 6, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 5, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.layernorm_guard.layer_norm_fwd", "n_typed": 10, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "class", "name": "vllm.model_executor.layers.fla.ops.layernorm_guard.LayerNormGated", "methods": [ { "kind": "function", "name": "LayerNormGated.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "LayerNormGated.reset_parameters", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LayerNormGated.forward", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LayerNormGated.eps", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LayerNormGated.weight", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LayerNormGated.bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LayerNormGated.group_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LayerNormGated.norm_before_gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 5, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 8, "n_attrs": 5, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.layernorm_guard.calc_rows_per_block", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.layernorm_guard.rms_norm_ref", "n_typed": 0, "n_any": 0, "n_untyped": 9, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "class", "name": "vllm.model_executor.layers.fla.ops.layernorm_guard.LayerNormFn", "methods": [ { "kind": "function", "name": "LayerNormFn.forward", "n_typed": 1, "n_any": 0, "n_untyped": 10, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 } ], "properties": [], "attrs": [], "n_typable": 11, "n_typed": 1, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 10, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.layernorm_guard.layernorm_fn", "n_typed": 1, "n_any": 0, "n_untyped": 9, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.layernorm_guard.rmsnorm_fn", "n_typed": 1, "n_any": 0, "n_untyped": 8, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.layernorm_guard.layer_norm_fwd_kernel", "n_typed": 8, "n_any": 0, "n_untyped": 13, "n_overloads": 1, "n_typable": 21, "n_params": 20, "n_function_overloads": 1, "n_function_params": 20 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fla.ops.layernorm_guard", "names": [ "vllm.model_executor.layers.fla.ops.layernorm_guard.LayerNormFn", "vllm.model_executor.layers.fla.ops.layernorm_guard.LayerNormGated", "vllm.model_executor.layers.fla.ops.layernorm_guard.RMSNormGated", "vllm.model_executor.layers.fla.ops.layernorm_guard.calc_rows_per_block", "vllm.model_executor.layers.fla.ops.layernorm_guard.layer_norm_fwd", "vllm.model_executor.layers.fla.ops.layernorm_guard.layer_norm_fwd_kernel", "vllm.model_executor.layers.fla.ops.layernorm_guard.layernorm_fn", "vllm.model_executor.layers.fla.ops.layernorm_guard.rms_norm_ref", "vllm.model_executor.layers.fla.ops.layernorm_guard.rmsnorm_fn" ], "n_typable": 107, "n_typed": 35, "n_any": 0, "n_untyped": 72, "n_functions": 6, "n_function_overloads": 6, "n_function_params": 57, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 27, "n_classes": 3, "n_attrs": 10, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fla/ops/chunk_delta_h.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.chunk_delta_h.chunk_gated_delta_rule_fwd_kernel_h_blockdim64", "n_typed": 12, "n_any": 0, "n_untyped": 13, "n_overloads": 1, "n_typable": 25, "n_params": 24, "n_function_overloads": 1, "n_function_params": 24 }, { "kind": "attr", "name": "vllm.model_executor.layers.fla.ops.chunk_delta_h.NUM_WARPS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.chunk_delta_h.chunk_gated_delta_rule_fwd_h", "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fla.ops.chunk_delta_h", "names": [ "vllm.model_executor.layers.fla.ops.chunk_delta_h.NUM_WARPS", "vllm.model_executor.layers.fla.ops.chunk_delta_h.chunk_gated_delta_rule_fwd_h", "vllm.model_executor.layers.fla.ops.chunk_delta_h.chunk_gated_delta_rule_fwd_kernel_h_blockdim64" ], "n_typable": 36, "n_typed": 23, "n_any": 0, "n_untyped": 13, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 34, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fla/ops/chunk_o.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.chunk_o.chunk_fwd_kernel_o", "n_typed": 9, "n_any": 0, "n_untyped": 11, "n_overloads": 1, "n_typable": 20, "n_params": 19, "n_function_overloads": 1, "n_function_params": 19 }, { "kind": "attr", "name": "vllm.model_executor.layers.fla.ops.chunk_o.BKV_LIST", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.fla.ops.chunk_o.NUM_WARPS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.chunk_o.chunk_fwd_o", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fla.ops.chunk_o", "names": [ "vllm.model_executor.layers.fla.ops.chunk_o.BKV_LIST", "vllm.model_executor.layers.fla.ops.chunk_o.NUM_WARPS", "vllm.model_executor.layers.fla.ops.chunk_o.chunk_fwd_kernel_o", "vllm.model_executor.layers.fla.ops.chunk_o.chunk_fwd_o" ], "n_typable": 30, "n_typed": 18, "n_any": 0, "n_untyped": 12, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 27, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fla/ops/chunk_scaled_dot_kkt.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.chunk_scaled_dot_kkt.chunk_scaled_dot_kkt_fwd_kernel", "n_typed": 7, "n_any": 0, "n_untyped": 8, "n_overloads": 1, "n_typable": 15, "n_params": 14, "n_function_overloads": 1, "n_function_params": 14 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.chunk_scaled_dot_kkt.chunk_scaled_dot_kkt_fwd", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fla.ops.chunk_scaled_dot_kkt", "names": [ "vllm.model_executor.layers.fla.ops.chunk_scaled_dot_kkt.chunk_scaled_dot_kkt_fwd", "vllm.model_executor.layers.fla.ops.chunk_scaled_dot_kkt.chunk_scaled_dot_kkt_fwd_kernel" ], "n_typable": 22, "n_typed": 14, "n_any": 0, "n_untyped": 8, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 20, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fla/ops/cumsum.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.cumsum.chunk_local_cumsum_vector", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "attr", "name": "vllm.model_executor.layers.fla.ops.cumsum.BS_LIST", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.cumsum.chunk_local_cumsum_vector_kernel", "n_typed": 8, "n_any": 0, "n_untyped": 6, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.cumsum.chunk_local_cumsum_scalar", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.cumsum.chunk_local_cumsum_scalar_kernel", "n_typed": 6, "n_any": 0, "n_untyped": 6, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.cumsum.chunk_local_cumsum", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fla.ops.cumsum", "names": [ "vllm.model_executor.layers.fla.ops.cumsum.BS_LIST", "vllm.model_executor.layers.fla.ops.cumsum.chunk_local_cumsum", "vllm.model_executor.layers.fla.ops.cumsum.chunk_local_cumsum_scalar", "vllm.model_executor.layers.fla.ops.cumsum.chunk_local_cumsum_scalar_kernel", "vllm.model_executor.layers.fla.ops.cumsum.chunk_local_cumsum_vector", "vllm.model_executor.layers.fla.ops.cumsum.chunk_local_cumsum_vector_kernel" ], "n_typable": 49, "n_typed": 35, "n_any": 0, "n_untyped": 14, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 43, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fla/ops/index.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.index.prepare_lens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.index.prepare_chunk_offsets", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.index.prepare_chunk_indices", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fla.ops.index", "names": [ "vllm.model_executor.layers.fla.ops.index.prepare_chunk_indices", "vllm.model_executor.layers.fla.ops.index.prepare_chunk_offsets", "vllm.model_executor.layers.fla.ops.index.prepare_lens" ], "n_typable": 8, "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 5, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fla/ops/kda.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.kda.rms_norm_gated", "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "attr", "name": "vllm.model_executor.layers.fla.ops.kda.NUM_WARPS_AUTOTUNE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.kda.chunk_gla_fwd_o_gk", "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "attr", "name": "vllm.model_executor.layers.fla.ops.kda.BT_LIST_AUTOTUNE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.kda.chunk_gla_fwd_kernel_o", "n_typed": 7, "n_any": 0, "n_untyped": 11, "n_overloads": 1, "n_typable": 18, "n_params": 17, "n_function_overloads": 1, "n_function_params": 17 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.kda.layer_norm_gated_fwd", "n_typed": 10, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.kda.chunk_kda_fwd", "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.kda.layer_norm_gated_fwd_kernel1", "n_typed": 8, "n_any": 0, "n_untyped": 11, "n_overloads": 1, "n_typable": 19, "n_params": 18, "n_function_overloads": 1, "n_function_params": 18 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.kda.recompute_w_u_fwd_kernel", "n_typed": 10, "n_any": 0, "n_untyped": 14, "n_overloads": 1, "n_typable": 24, "n_params": 23, "n_function_overloads": 1, "n_function_params": 23 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.kda.chunk_kda_scaled_dot_kkt_fwd_kernel_intra_sub_inter", "n_typed": 7, "n_any": 0, "n_untyped": 11, "n_overloads": 1, "n_typable": 18, "n_params": 17, "n_function_overloads": 1, "n_function_params": 17 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.kda.fused_recurrent_kda_fwd", "n_typed": 13, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.kda.kda_gate_fwd_kernel", "n_typed": 6, "n_any": 0, "n_untyped": 7, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.kda.fused_recurrent_kda", "n_typed": 12, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.kda.recompute_w_u_fwd", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.kda.chunk_kda", "n_typed": 10, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "class", "name": "vllm.model_executor.layers.fla.ops.kda.FusedRMSNormGated", "methods": [ { "kind": "function", "name": "FusedRMSNormGated.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "FusedRMSNormGated.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FusedRMSNormGated.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedRMSNormGated.elementwise_affine", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedRMSNormGated.eps", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedRMSNormGated.activation", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedRMSNormGated.weight", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 13, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 11, "n_attrs": 5, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.kda.layer_norm_gated_fwd_kernel", "n_typed": 9, "n_any": 0, "n_untyped": 12, "n_overloads": 1, "n_typable": 21, "n_params": 20, "n_function_overloads": 1, "n_function_params": 20 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.kda.chunk_kda_scaled_dot_kkt_fwd_kernel_intra_sub_intra", "n_typed": 6, "n_any": 0, "n_untyped": 11, "n_overloads": 1, "n_typable": 17, "n_params": 16, "n_function_overloads": 1, "n_function_params": 16 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.kda.fused_kda_gate", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.kda.chunk_kda_scaled_dot_kkt_fwd", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fla.ops.kda", "names": [ "vllm.model_executor.layers.fla.ops.kda.BT_LIST_AUTOTUNE", "vllm.model_executor.layers.fla.ops.kda.FusedRMSNormGated", "vllm.model_executor.layers.fla.ops.kda.NUM_WARPS_AUTOTUNE", "vllm.model_executor.layers.fla.ops.kda.chunk_gla_fwd_kernel_o", "vllm.model_executor.layers.fla.ops.kda.chunk_gla_fwd_o_gk", "vllm.model_executor.layers.fla.ops.kda.chunk_kda", "vllm.model_executor.layers.fla.ops.kda.chunk_kda_fwd", "vllm.model_executor.layers.fla.ops.kda.chunk_kda_scaled_dot_kkt_fwd", "vllm.model_executor.layers.fla.ops.kda.chunk_kda_scaled_dot_kkt_fwd_kernel_intra_sub_inter", "vllm.model_executor.layers.fla.ops.kda.chunk_kda_scaled_dot_kkt_fwd_kernel_intra_sub_intra", "vllm.model_executor.layers.fla.ops.kda.fused_kda_gate", "vllm.model_executor.layers.fla.ops.kda.fused_recurrent_kda", "vllm.model_executor.layers.fla.ops.kda.fused_recurrent_kda_fwd", "vllm.model_executor.layers.fla.ops.kda.kda_gate_fwd_kernel", "vllm.model_executor.layers.fla.ops.kda.layer_norm_gated_fwd", "vllm.model_executor.layers.fla.ops.kda.layer_norm_gated_fwd_kernel", "vllm.model_executor.layers.fla.ops.kda.layer_norm_gated_fwd_kernel1", "vllm.model_executor.layers.fla.ops.kda.recompute_w_u_fwd", "vllm.model_executor.layers.fla.ops.kda.recompute_w_u_fwd_kernel", "vllm.model_executor.layers.fla.ops.kda.rms_norm_gated" ], "n_typable": 251, "n_typed": 162, "n_any": 0, "n_untyped": 89, "n_functions": 17, "n_function_overloads": 17, "n_function_params": 216, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 11, "n_classes": 1, "n_attrs": 7, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fla/ops/l2norm.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.l2norm.l2norm_fwd_kernel2", "n_typed": 2, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.l2norm.l2norm_fwd_kernel", "n_typed": 3, "n_any": 0, "n_untyped": 6, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "attr", "name": "vllm.model_executor.layers.fla.ops.l2norm.BT_LIST", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.fla.ops.l2norm.USE_DEFAULT_FLA_NORM", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.l2norm.l2norm_fwd_kernel1", "n_typed": 1, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.l2norm.l2norm_fwd", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fla.ops.l2norm", "names": [ "vllm.model_executor.layers.fla.ops.l2norm.BT_LIST", "vllm.model_executor.layers.fla.ops.l2norm.USE_DEFAULT_FLA_NORM", "vllm.model_executor.layers.fla.ops.l2norm.l2norm_fwd", "vllm.model_executor.layers.fla.ops.l2norm.l2norm_fwd_kernel", "vllm.model_executor.layers.fla.ops.l2norm.l2norm_fwd_kernel1", "vllm.model_executor.layers.fla.ops.l2norm.l2norm_fwd_kernel2" ], "n_typable": 27, "n_typed": 9, "n_any": 0, "n_untyped": 18, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 22, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fla/ops/op.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.op.gather", "n_typed": 0, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.op.make_tensor_descriptor", "n_typed": 0, "n_any": 0, "n_untyped": 6, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fla.ops.op", "names": [ "vllm.model_executor.layers.fla.ops.op.gather", "vllm.model_executor.layers.fla.ops.op.make_tensor_descriptor" ], "n_typable": 11, "n_typed": 0, "n_any": 0, "n_untyped": 11, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 9, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fla/ops/solve_tril.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.solve_tril.solve_tril", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.solve_tril.merge_16x16_to_64x64_inverse_kernel", "n_typed": 5, "n_any": 0, "n_untyped": 6, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "attr", "name": "vllm.model_executor.layers.fla.ops.solve_tril.ALLOWED_TRIL_PRECISIONS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.fla.ops.solve_tril.FLA_TRIL_PRECISION", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.solve_tril.merge_16x16_to_32x32_inverse_kernel", "n_typed": 5, "n_any": 0, "n_untyped": 6, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.solve_tril.solve_tril_16x16_kernel", "n_typed": 5, "n_any": 0, "n_untyped": 6, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fla.ops.solve_tril", "names": [ "vllm.model_executor.layers.fla.ops.solve_tril.ALLOWED_TRIL_PRECISIONS", "vllm.model_executor.layers.fla.ops.solve_tril.FLA_TRIL_PRECISION", "vllm.model_executor.layers.fla.ops.solve_tril.merge_16x16_to_32x32_inverse_kernel", "vllm.model_executor.layers.fla.ops.solve_tril.merge_16x16_to_64x64_inverse_kernel", "vllm.model_executor.layers.fla.ops.solve_tril.solve_tril", "vllm.model_executor.layers.fla.ops.solve_tril.solve_tril_16x16_kernel" ], "n_typable": 38, "n_typed": 19, "n_any": 0, "n_untyped": 19, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 33, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fla/ops/utils.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.layers.fla.ops.utils.SUPPRESS_LEVEL", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.utils.get_all_max_shared_mem", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.utils.check_shared_mem", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.model_executor.layers.fla.ops.utils.is_amd", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.utils.input_guard", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.fla.ops.utils.is_nvidia", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.utils.tensor_cache", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.fla.ops.utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.fla.ops.utils.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.fla.ops.utils.device_platform", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.fla.ops.utils.is_nvidia_hopper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.fla.ops.utils.is_gather_supported", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.fla.ops.utils.is_intel", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.utils.get_available_device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.fla.ops.utils.FLA_CI_ENV", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.fla.ops.utils.is_intel_alchemist", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.fla.ops.utils.FLA_GDN_FIX_BT", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.fla.ops.utils.use_cuda_graph", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.fla.ops.utils.COMPILER_MODE", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.fla.ops.utils.Backend", "methods": [ { "kind": "function", "name": "Backend.get_shared_memory", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Backend.ADA", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Backend.AMPERE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Backend.HOPPER", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Backend.DEFAULT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 4, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.fla.ops.utils.is_tma_supported", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.fla.ops.utils.device_torch_lib", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fla.ops.utils", "names": [ "vllm.model_executor.layers.fla.ops.utils.Backend", "vllm.model_executor.layers.fla.ops.utils.COMPILER_MODE", "vllm.model_executor.layers.fla.ops.utils.FLA_CI_ENV", "vllm.model_executor.layers.fla.ops.utils.FLA_GDN_FIX_BT", "vllm.model_executor.layers.fla.ops.utils.SUPPRESS_LEVEL", "vllm.model_executor.layers.fla.ops.utils.check_shared_mem", "vllm.model_executor.layers.fla.ops.utils.device", "vllm.model_executor.layers.fla.ops.utils.device_platform", "vllm.model_executor.layers.fla.ops.utils.device_torch_lib", "vllm.model_executor.layers.fla.ops.utils.get_all_max_shared_mem", "vllm.model_executor.layers.fla.ops.utils.get_available_device", "vllm.model_executor.layers.fla.ops.utils.input_guard", "vllm.model_executor.layers.fla.ops.utils.is_amd", "vllm.model_executor.layers.fla.ops.utils.is_gather_supported", "vllm.model_executor.layers.fla.ops.utils.is_intel", "vllm.model_executor.layers.fla.ops.utils.is_intel_alchemist", "vllm.model_executor.layers.fla.ops.utils.is_nvidia", "vllm.model_executor.layers.fla.ops.utils.is_nvidia_hopper", "vllm.model_executor.layers.fla.ops.utils.is_tma_supported", "vllm.model_executor.layers.fla.ops.utils.logger", "vllm.model_executor.layers.fla.ops.utils.tensor_cache", "vllm.model_executor.layers.fla.ops.utils.use_cuda_graph" ], "n_typable": 24, "n_typed": 10, "n_any": 0, "n_untyped": 14, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 4, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_classes": 1, "n_attrs": 20, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fla/ops/wy_fast.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.wy_fast.recompute_w_u_fwd_kernel", "n_typed": 8, "n_any": 0, "n_untyped": 11, "n_overloads": 1, "n_typable": 19, "n_params": 18, "n_function_overloads": 1, "n_function_params": 18 }, { "kind": "function", "name": "vllm.model_executor.layers.fla.ops.wy_fast.recompute_w_u_fwd", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fla.ops.wy_fast", "names": [ "vllm.model_executor.layers.fla.ops.wy_fast.recompute_w_u_fwd", "vllm.model_executor.layers.fla.ops.wy_fast.recompute_w_u_fwd_kernel" ], "n_typable": 26, "n_typed": 15, "n_any": 0, "n_untyped": 11, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 24, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/activation.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.activation.apply_moe_activation", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.activation.activation_without_mul", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.activation.MoEActivation", "methods": [ { "kind": "function", "name": "MoEActivation.without_mul", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoEActivation.from_str", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "MoEActivation.is_gated", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "MoEActivation.custom_op_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "MoEActivation.SILU", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MoEActivation.GELU", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MoEActivation.RELU2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MoEActivation.SWIGLUOAI", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MoEActivation.SWIGLUSTEP", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MoEActivation.SILU_NO_MUL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MoEActivation.GELU_NO_MUL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MoEActivation.RELU2_NO_MUL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 8, "n_properties": 2 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.activation", "names": [ "vllm.model_executor.layers.fused_moe.activation.MoEActivation", "vllm.model_executor.layers.fused_moe.activation.activation_without_mul", "vllm.model_executor.layers.fused_moe.activation.apply_moe_activation" ], "n_typable": 11, "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 4, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_classes": 1, "n_attrs": 8, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/xpu_fused_moe.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.xpu_fused_moe.XPUExpertsFp8", "methods": [ { "kind": "function", "name": "XPUExpertsFp8.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "XPUExpertsFp8.is_fp8", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 6, "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 4, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.xpu_fused_moe.XPUExperts", "methods": [ { "kind": "function", "name": "XPUExperts.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "XPUExperts.activation_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "XPUExperts._supports_current_device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "XPUExperts._supports_no_act_and_mul", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "XPUExperts._supports_activation", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "XPUExperts._supports_parallel_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "XPUExperts._supports_quant_scheme", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "XPUExperts.supports_chunking", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "XPUExperts.supports_expert_map", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "XPUExperts.finalize_weight_and_reduce_impl", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "XPUExperts.workspace_shapes", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "XPUExperts.apply", "n_typed": 15, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 } ], "properties": [ { "kind": "property", "name": "XPUExperts.expects_unquantized_inputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "XPUExperts.is_fp8", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 45, "n_typed": 42, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 31, "n_attrs": 1, "n_properties": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.xpu_fused_moe", "names": [ "vllm.model_executor.layers.fused_moe.xpu_fused_moe.XPUExperts", "vllm.model_executor.layers.fused_moe.xpu_fused_moe.XPUExpertsFp8" ], "n_typable": 51, "n_typed": 46, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 35, "n_classes": 2, "n_attrs": 2, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/layer.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.layer.FusedMoeWeightScaleSupported", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "FusedMoeWeightScaleSupported.TENSOR", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoeWeightScaleSupported.CHANNEL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoeWeightScaleSupported.GROUP", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoeWeightScaleSupported.BLOCK", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.layer.FusedMoE", "methods": [ { "kind": "function", "name": "FusedMoE.__init__", "n_typed": 32, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 34, "n_params": 33, "n_function_overloads": 1, "n_function_params": 33 }, { "kind": "function", "name": "FusedMoE._init_runner", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FusedMoE._replace_quant_method", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FusedMoE.maybe_init_modular_kernel", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FusedMoE._maybe_init_expert_routing_tables", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FusedMoE.ensure_round_robin_expert_routing_tables", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "FusedMoE.update_expert_map", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FusedMoE._load_per_tensor_weight_scale", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FusedMoE._load_combined_w13_weight_scale", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FusedMoE._load_model_weight_or_group_weight_scale", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "FusedMoE._load_per_channel_weight_scale", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "FusedMoE._load_w13", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "FusedMoE._load_w2", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "FusedMoE._load_single_value", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "FusedMoE._load_g_idx", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "FusedMoE._map_global_expert_id_to_local_expert_id", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FusedMoE._init_aiter_shared_experts_topK_buffer", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FusedMoE.weight_loader", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 7, "n_params": 6, "n_function_overloads": 2, "n_function_params": 6 }, { "kind": "function", "name": "FusedMoE.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FusedMoE.get_expert_weights", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FusedMoE.set_eplb_state", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FusedMoE.ensure_moe_quant_config_init", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FusedMoE.must_reduce_shared_expert_outputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FusedMoE.maybe_all_reduce_tensor_model_parallel", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FusedMoE.forward_native", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FusedMoE.forward_cuda", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FusedMoE.make_expert_params_mapping", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "FusedMoE.extra_repr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "FusedMoE.shared_experts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoE.layer_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "FusedMoE.gate", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoE.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "FusedMoE.ep_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "FusedMoE.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "FusedMoE.ep_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "FusedMoE.use_ep", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "FusedMoE.is_internal_router", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoE.moe_quant_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoE.expert_map", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "FusedMoE.params_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoE.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoE.is_sequence_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoE.sp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoE.moe_parallel_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoE.global_num_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoE.logical_num_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoE.expert_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoE.layer_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoE.enable_eplb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoE.eplb_state", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoE.expert_placement_strategy", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoE.rocm_aiter_fmoe_enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoE.aiter_fmoe_shared_expert_enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoE.num_fused_shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoE.top_k", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoE.intermediate_size_per_partition", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoE.reduce_results", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoE.renormalize", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoE.use_grouped_topk", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoE.num_expert_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoE.topk_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoE.custom_routing_function", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoE.scoring_func", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoE.routed_scaling_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoE.e_score_correction_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoE.apply_router_weight_on_input", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoE.activation", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoE.router", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoE.routing_method_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoE.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoE.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoE.moe_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoE.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoE.quant_method", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoE.base_quant_method", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoE.use_overlapped", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoE.runner", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoE.local_num_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 180, "n_typed": 124, "n_any": 0, "n_untyped": 56, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 28, "n_method_overloads": 29, "n_method_params": 102, "n_attrs": 39, "n_properties": 11 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.layer.determine_expert_map", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.layer.determine_expert_placement_strategy", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.layer.maybe_roundup_hidden_size", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.layer.get_compressed_expert_map", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.fused_moe.layer.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [ { "kind": "type", "rules": [ "attr-defined" ] } ], "name": "vllm.model_executor.layers.fused_moe.layer", "names": [ "vllm.model_executor.layers.fused_moe.layer.FusedMoE", "vllm.model_executor.layers.fused_moe.layer.FusedMoeWeightScaleSupported", "vllm.model_executor.layers.fused_moe.layer.determine_expert_map", "vllm.model_executor.layers.fused_moe.layer.determine_expert_placement_strategy", "vllm.model_executor.layers.fused_moe.layer.get_compressed_expert_map", "vllm.model_executor.layers.fused_moe.layer.logger", "vllm.model_executor.layers.fused_moe.layer.maybe_roundup_hidden_size" ], "n_typable": 203, "n_typed": 146, "n_any": 0, "n_untyped": 57, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 18, "n_methods": 28, "n_method_overloads": 29, "n_method_params": 102, "n_classes": 2, "n_attrs": 44, "n_properties": 11, "n_type_ignores": 1 }, { "path": "vllm/model_executor/layers/fused_moe/__init__.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.get_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.override_config", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.fused_moe.fused_topk", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.fused_moe.fused_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe", "names": [ "vllm.model_executor.layers.fused_moe.fused_experts", "vllm.model_executor.layers.fused_moe.fused_topk", "vllm.model_executor.layers.fused_moe.get_config", "vllm.model_executor.layers.fused_moe.override_config" ], "n_typable": 5, "n_typed": 1, "n_any": 0, "n_untyped": 4, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 1, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/fused_moe.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.fused_moe.TritonExperts", "methods": [ { "kind": "function", "name": "TritonExperts.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TritonExperts.activation_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TritonExperts._supports_current_device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TritonExperts._supports_no_act_and_mul", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TritonExperts._supports_quant_scheme", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TritonExperts._supports_activation", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TritonExperts._supports_parallel_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TritonExperts.supports_chunking", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TritonExperts.supports_expert_map", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TritonExperts.finalize_weight_and_reduce_impl", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TritonExperts.workspace_shapes", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "TritonExperts.apply", "n_typed": 15, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 }, { "kind": "function", "name": "TritonExperts.moe_sum", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 44, "n_typed": 42, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 31, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.fused_moe.TritonWNA16Experts", "methods": [ { "kind": "function", "name": "TritonWNA16Experts._supports_current_device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TritonWNA16Experts._supports_no_act_and_mul", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TritonWNA16Experts._supports_quant_scheme", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TritonWNA16Experts._supports_activation", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TritonWNA16Experts._supports_parallel_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TritonWNA16Experts.apply", "n_typed": 15, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 } ], "properties": [], "attrs": [], "n_typable": 25, "n_typed": 24, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 19, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.fused_moe.get_config_file_name", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.fused_moe.get_moe_wna16_block_config", "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.fused_moe.dispatch_fused_experts_func", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.fused_moe.fused_moe_kernel", "n_typed": 16, "n_any": 0, "n_untyped": 29, "n_overloads": 1, "n_typable": 45, "n_params": 44, "n_function_overloads": 1, "n_function_params": 44 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.fused_moe.torch_vllm_outplace_fused_experts", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.fused_moe.invoke_fused_moe_wna16_triton_kernel", "n_typed": 16, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 17, "n_params": 16, "n_function_overloads": 1, "n_function_params": 16 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.fused_moe.invoke_fused_moe_wna16_cuda_kernel", "n_typed": 13, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.fused_moe.get_default_config", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.fused_moe.fused_moe_kernel_gptq_awq", "n_typed": 15, "n_any": 0, "n_untyped": 25, "n_overloads": 1, "n_typable": 40, "n_params": 39, "n_function_overloads": 1, "n_function_params": 39 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.fused_moe.outplace_fused_experts", "n_typed": 25, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 25, "n_params": 24, "n_function_overloads": 1, "n_function_params": 24 }, { "kind": "attr", "name": "vllm.model_executor.layers.fused_moe.fused_moe.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.fused_moe.try_get_optimal_moe_config", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.fused_moe.dispatch_fused_moe_kernel", "n_typed": 22, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 22, "n_params": 21, "n_function_overloads": 1, "n_function_params": 21 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.fused_moe.inplace_fused_experts", "n_typed": 25, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 25, "n_params": 24, "n_function_overloads": 1, "n_function_params": 24 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.fused_moe.zero_experts_compute_triton", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.fused_moe.invoke_fused_moe_triton_kernel", "n_typed": 20, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 21, "n_params": 20, "n_function_overloads": 1, "n_function_params": 20 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.fused_moe.should_moe_wna16_use_cuda", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.fused_moe.torch_vllm_inplace_fused_experts", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.fused_moe.write_zeros_to_output", "n_typed": 0, "n_any": 0, "n_untyped": 11, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.fused_moe.fused_experts", "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.fused_moe.compute_identity_kernel", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.fused_moe.get_moe_configs", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.fused_moe.fused_experts_impl", "n_typed": 26, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 26, "n_params": 25, "n_function_overloads": 1, "n_function_params": 25 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.fused_moe.outplace_fused_experts_fake", "n_typed": 25, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 25, "n_params": 24, "n_function_overloads": 1, "n_function_params": 24 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.fused_moe.inplace_fused_experts_fake", "n_typed": 25, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 25, "n_params": 24, "n_function_overloads": 1, "n_function_params": 24 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.fused_moe", "names": [ "vllm.model_executor.layers.fused_moe.fused_moe.TritonExperts", "vllm.model_executor.layers.fused_moe.fused_moe.TritonWNA16Experts", "vllm.model_executor.layers.fused_moe.fused_moe.compute_identity_kernel", "vllm.model_executor.layers.fused_moe.fused_moe.dispatch_fused_experts_func", "vllm.model_executor.layers.fused_moe.fused_moe.dispatch_fused_moe_kernel", "vllm.model_executor.layers.fused_moe.fused_moe.fused_experts", "vllm.model_executor.layers.fused_moe.fused_moe.fused_experts_impl", "vllm.model_executor.layers.fused_moe.fused_moe.fused_moe_kernel", "vllm.model_executor.layers.fused_moe.fused_moe.fused_moe_kernel_gptq_awq", "vllm.model_executor.layers.fused_moe.fused_moe.get_config_file_name", "vllm.model_executor.layers.fused_moe.fused_moe.get_default_config", "vllm.model_executor.layers.fused_moe.fused_moe.get_moe_configs", "vllm.model_executor.layers.fused_moe.fused_moe.get_moe_wna16_block_config", "vllm.model_executor.layers.fused_moe.fused_moe.inplace_fused_experts", "vllm.model_executor.layers.fused_moe.fused_moe.inplace_fused_experts_fake", "vllm.model_executor.layers.fused_moe.fused_moe.invoke_fused_moe_triton_kernel", "vllm.model_executor.layers.fused_moe.fused_moe.invoke_fused_moe_wna16_cuda_kernel", "vllm.model_executor.layers.fused_moe.fused_moe.invoke_fused_moe_wna16_triton_kernel", "vllm.model_executor.layers.fused_moe.fused_moe.logger", "vllm.model_executor.layers.fused_moe.fused_moe.outplace_fused_experts", "vllm.model_executor.layers.fused_moe.fused_moe.outplace_fused_experts_fake", "vllm.model_executor.layers.fused_moe.fused_moe.should_moe_wna16_use_cuda", "vllm.model_executor.layers.fused_moe.fused_moe.torch_vllm_inplace_fused_experts", "vllm.model_executor.layers.fused_moe.fused_moe.torch_vllm_outplace_fused_experts", "vllm.model_executor.layers.fused_moe.fused_moe.try_get_optimal_moe_config", "vllm.model_executor.layers.fused_moe.fused_moe.write_zeros_to_output", "vllm.model_executor.layers.fused_moe.fused_moe.zero_experts_compute_triton" ], "n_typable": 440, "n_typed": 364, "n_any": 0, "n_untyped": 76, "n_functions": 24, "n_function_overloads": 24, "n_function_params": 346, "n_methods": 19, "n_method_overloads": 19, "n_method_params": 50, "n_classes": 2, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/shared_fused_moe.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.shared_fused_moe.SharedFusedMoE", "methods": [ { "kind": "function", "name": "SharedFusedMoE.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.shared_fused_moe", "names": [ "vllm.model_executor.layers.fused_moe.shared_fused_moe.SharedFusedMoE" ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/modular_kernel.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.modular_kernel.FusedMoEExpertsModular", "methods": [ { "kind": "function", "name": "FusedMoEExpertsModular.is_monolithic", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FusedMoEExpertsModular.moe_problem_size", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FusedMoEExpertsModular.workspace_dtype", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FusedMoEExpertsModular.workspace_shapes", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "FusedMoEExpertsModular.adjust_N_for_activation", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FusedMoEExpertsModular.activation", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "FusedMoEExpertsModular.finalize_weight_and_reduce_impl", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FusedMoEExpertsModular.apply", "n_typed": 16, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 } ], "properties": [], "attrs": [], "n_typable": 41, "n_typed": 41, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 33, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.modular_kernel.FusedMoEActivationFormat", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "FusedMoEActivationFormat.Standard", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoEActivationFormat.BatchedExperts", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.modular_kernel.FusedMoEPrepareAndFinalizeModular", "methods": [ { "kind": "function", "name": "FusedMoEPrepareAndFinalizeModular.prepare", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "FusedMoEPrepareAndFinalizeModular.supports_async", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FusedMoEPrepareAndFinalizeModular.prepare_async", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "FusedMoEPrepareAndFinalizeModular.finalize", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "FusedMoEPrepareAndFinalizeModular.finalize_async", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [], "n_typable": 33, "n_typed": 33, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 28, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.modular_kernel.FusedMoEPrepareAndFinalize", "methods": [ { "kind": "function", "name": "FusedMoEPrepareAndFinalize.post_init_setup", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FusedMoEPrepareAndFinalize.topk_indices_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FusedMoEPrepareAndFinalize.max_num_tokens_per_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FusedMoEPrepareAndFinalize.num_dispatchers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FusedMoEPrepareAndFinalize.output_is_reduced", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "FusedMoEPrepareAndFinalize.activation_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [], "n_typable": 7, "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 1, "n_attrs": 0, "n_properties": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.modular_kernel.FusedMoEKernelMonolithicImpl", "methods": [ { "kind": "function", "name": "FusedMoEKernelMonolithicImpl.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FusedMoEKernelMonolithicImpl.apply", "n_typed": 13, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FusedMoEKernelMonolithicImpl.prepare_finalize", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoEKernelMonolithicImpl.fused_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 15, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 14, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.modular_kernel.TopKWeightAndReduce", "methods": [ { "kind": "function", "name": "TopKWeightAndReduce.apply", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.fused_moe.modular_kernel.PrepareMonolithicResultType", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.modular_kernel.FusedMoEExpertsMonolithic", "methods": [ { "kind": "function", "name": "FusedMoEExpertsMonolithic._supports_routing_method", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "FusedMoEExpertsMonolithic._supports_router_logits_dtype", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FusedMoEExpertsMonolithic.is_monolithic", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FusedMoEExpertsMonolithic.apply", "n_typed": 14, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 } ], "properties": [], "attrs": [], "n_typable": 22, "n_typed": 22, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 18, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.modular_kernel.FusedMoEKernel", "methods": [ { "kind": "function", "name": "FusedMoEKernel.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "FusedMoEKernel._post_init_setup", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FusedMoEKernel.supports_expert_map", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FusedMoEKernel.output_is_reduced", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FusedMoEKernel.apply_monolithic", "n_typed": 13, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 }, { "kind": "function", "name": "FusedMoEKernel.apply", "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 } ], "properties": [ { "kind": "property", "name": "FusedMoEKernel.is_monolithic", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEKernel.prepare_finalize", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEKernel.fused_experts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "FusedMoEKernel.shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoEKernel.impl", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 38, "n_typed": 35, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 27, "n_attrs": 2, "n_properties": 3 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.modular_kernel.FusedMoEKernelModularImpl", "methods": [ { "kind": "function", "name": "FusedMoEKernelModularImpl.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "FusedMoEKernelModularImpl._chunk_info", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FusedMoEKernelModularImpl._allocate_buffers", "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "FusedMoEKernelModularImpl._slice_output_tensor", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "FusedMoEKernelModularImpl._slice_expert_tokens_metadata", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "FusedMoEKernelModularImpl._prepare", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "FusedMoEKernelModularImpl._fused_experts", "n_typed": 14, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 }, { "kind": "function", "name": "FusedMoEKernelModularImpl._finalize", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "FusedMoEKernelModularImpl.apply", "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FusedMoEKernelModularImpl.prepare_finalize", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoEKernelModularImpl.fused_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoEKernelModularImpl.shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoEKernelModularImpl.moe_parallel_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoEKernelModularImpl.inplace", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoEKernelModularImpl.is_dp_ep", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 78, "n_typed": 71, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 63, "n_attrs": 6, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.fused_moe.modular_kernel.ReceiverType", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.modular_kernel.FusedMoEPrepareAndFinalizeMonolithic", "methods": [ { "kind": "function", "name": "FusedMoEPrepareAndFinalizeMonolithic.prepare", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FusedMoEPrepareAndFinalizeMonolithic.finalize", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.fused_moe.modular_kernel.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.modular_kernel.ExpertTokensMetadata", "methods": [ { "kind": "function", "name": "ExpertTokensMetadata.make_from_list", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ExpertTokensMetadata.expert_num_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ExpertTokensMetadata.expert_num_tokens_cpu", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.fused_moe.modular_kernel.PrepareResultType", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.modular_kernel.FusedMoEExperts", "methods": [ { "kind": "function", "name": "FusedMoEExperts.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FusedMoEExperts.is_monolithic", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FusedMoEExperts.activation_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FusedMoEExperts.is_supported_config", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "FusedMoEExperts._supports_current_device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FusedMoEExperts._supports_no_act_and_mul", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FusedMoEExperts._supports_quant_scheme", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FusedMoEExperts._supports_activation", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FusedMoEExperts._supports_parallel_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FusedMoEExperts._supports_routing_method", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "FusedMoEExperts._supports_router_logits_dtype", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FusedMoEExperts._supports_shape", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FusedMoEExperts.supports_chunking", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FusedMoEExperts.supports_expert_map", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FusedMoEExperts.supports_packed_ue8m0_act_scales", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FusedMoEExperts.enable_chunking", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "FusedMoEExperts.expects_unquantized_inputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEExperts.quant_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEExperts.weight_quant_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEExperts.block_shape", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEExperts.per_act_token_quant", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEExperts.per_out_ch_quant", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEExperts.a1_scale", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEExperts.a2_scale", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEExperts.a1_gscale", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEExperts.a2_gscale", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEExperts.w1_scale", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEExperts.w2_scale", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEExperts.w1_zp", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEExperts.w2_zp", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEExperts.w1_bias", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEExperts.w2_bias", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEExperts.g1_alphas", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEExperts.g2_alphas", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "FusedMoEExperts.moe_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoEExperts.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoEExperts.max_num_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoEExperts.num_dispatchers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 57, "n_typed": 51, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 16, "n_method_overloads": 16, "n_method_params": 19, "n_attrs": 4, "n_properties": 18 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.modular_kernel", "names": [ "vllm.model_executor.layers.fused_moe.modular_kernel.ExpertTokensMetadata", "vllm.model_executor.layers.fused_moe.modular_kernel.FusedMoEActivationFormat", "vllm.model_executor.layers.fused_moe.modular_kernel.FusedMoEExperts", "vllm.model_executor.layers.fused_moe.modular_kernel.FusedMoEExpertsModular", "vllm.model_executor.layers.fused_moe.modular_kernel.FusedMoEExpertsMonolithic", "vllm.model_executor.layers.fused_moe.modular_kernel.FusedMoEKernel", "vllm.model_executor.layers.fused_moe.modular_kernel.FusedMoEKernelModularImpl", "vllm.model_executor.layers.fused_moe.modular_kernel.FusedMoEKernelMonolithicImpl", "vllm.model_executor.layers.fused_moe.modular_kernel.FusedMoEPrepareAndFinalize", "vllm.model_executor.layers.fused_moe.modular_kernel.FusedMoEPrepareAndFinalizeModular", "vllm.model_executor.layers.fused_moe.modular_kernel.FusedMoEPrepareAndFinalizeMonolithic", "vllm.model_executor.layers.fused_moe.modular_kernel.PrepareMonolithicResultType", "vllm.model_executor.layers.fused_moe.modular_kernel.PrepareResultType", "vllm.model_executor.layers.fused_moe.modular_kernel.ReceiverType", "vllm.model_executor.layers.fused_moe.modular_kernel.TopKWeightAndReduce", "vllm.model_executor.layers.fused_moe.modular_kernel.logger" ], "n_typable": 312, "n_typed": 291, "n_any": 0, "n_untyped": 21, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 59, "n_method_overloads": 59, "n_method_params": 215, "n_classes": 12, "n_attrs": 22, "n_properties": 22, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/router/grouped_topk_router.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.router.grouped_topk_router.GroupedTopk", "methods": [ { "kind": "function", "name": "GroupedTopk.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "GroupedTopk.forward_native", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GroupedTopk.forward_cuda", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GroupedTopk.forward_hip", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GroupedTopk.native_impl", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GroupedTopk.topk", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GroupedTopk.renormalize", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GroupedTopk.num_expert_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GroupedTopk.topk_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GroupedTopk.scoring_func", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GroupedTopk.routed_scaling_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GroupedTopk.num_fused_shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 28, "n_typed": 20, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 16, "n_attrs": 8, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.router.grouped_topk_router.fused_grouped_topk", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.router.grouped_topk_router.grouped_topk", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.router.grouped_topk_router.GroupedTopKRouter", "methods": [ { "kind": "function", "name": "GroupedTopKRouter.__init__", "n_typed": 12, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 }, { "kind": "function", "name": "GroupedTopKRouter._compute_routing", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [ { "kind": "property", "name": "GroupedTopKRouter.routing_method_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "GroupedTopKRouter.num_expert_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GroupedTopKRouter.topk_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GroupedTopKRouter.renormalize", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GroupedTopKRouter.scoring_func", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GroupedTopKRouter.routed_scaling_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GroupedTopKRouter.e_score_correction_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GroupedTopKRouter.num_fused_shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 25, "n_typed": 17, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 15, "n_attrs": 7, "n_properties": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.router.grouped_topk_router", "names": [ "vllm.model_executor.layers.fused_moe.router.grouped_topk_router.GroupedTopKRouter", "vllm.model_executor.layers.fused_moe.router.grouped_topk_router.GroupedTopk", "vllm.model_executor.layers.fused_moe.router.grouped_topk_router.fused_grouped_topk", "vllm.model_executor.layers.fused_moe.router.grouped_topk_router.grouped_topk" ], "n_typable": 73, "n_typed": 57, "n_any": 0, "n_untyped": 16, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 18, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 31, "n_classes": 2, "n_attrs": 15, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/cutlass_moe.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.cutlass_moe.cutlass_moe_w4a8_fp8", "n_typed": 21, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 21, "n_params": 20, "n_function_overloads": 1, "n_function_params": 20 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.cutlass_moe.CutlassExpertsFp8", "methods": [ { "kind": "function", "name": "CutlassExpertsFp8.activation_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CutlassExpertsFp8._supports_parallel_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CutlassExpertsFp8.supports_chunking", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CutlassExpertsFp8.supports_expert_map", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CutlassExpertsFp8.finalize_weight_and_reduce_impl", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CutlassExpertsFp8.workspace_dtype", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CutlassExpertsFp8.workspace_shapes", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 } ], "properties": [], "attrs": [], "n_typable": 17, "n_typed": 17, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 10, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.cutlass_moe.CutlassExpertsW4A8Fp8", "methods": [ { "kind": "function", "name": "CutlassExpertsW4A8Fp8.__init__", "n_typed": 12, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 }, { "kind": "function", "name": "CutlassExpertsW4A8Fp8.activation_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CutlassExpertsW4A8Fp8._supports_current_device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CutlassExpertsW4A8Fp8._supports_no_act_and_mul", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CutlassExpertsW4A8Fp8._supports_quant_scheme", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CutlassExpertsW4A8Fp8._supports_activation", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CutlassExpertsW4A8Fp8._supports_parallel_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CutlassExpertsW4A8Fp8.supports_chunking", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CutlassExpertsW4A8Fp8.supports_expert_map", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CutlassExpertsW4A8Fp8.finalize_weight_and_reduce_impl", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CutlassExpertsW4A8Fp8.workspace_dtype", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CutlassExpertsW4A8Fp8.workspace_shapes", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "CutlassExpertsW4A8Fp8.apply", "n_typed": 15, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CutlassExpertsW4A8Fp8.out_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CutlassExpertsW4A8Fp8.a_strides1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CutlassExpertsW4A8Fp8.a_strides2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CutlassExpertsW4A8Fp8.b_strides1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CutlassExpertsW4A8Fp8.b_strides2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CutlassExpertsW4A8Fp8.c_strides1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CutlassExpertsW4A8Fp8.c_strides2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CutlassExpertsW4A8Fp8.s_strides1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CutlassExpertsW4A8Fp8.s_strides2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CutlassExpertsW4A8Fp8.group_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 63, "n_typed": 51, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 40, "n_attrs": 10, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.cutlass_moe.CutlassBatchedExpertsFp8", "methods": [ { "kind": "function", "name": "CutlassBatchedExpertsFp8._supports_parallel_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CutlassBatchedExpertsFp8.activation_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CutlassBatchedExpertsFp8.supports_chunking", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CutlassBatchedExpertsFp8.supports_expert_map", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CutlassBatchedExpertsFp8.workspace_dtype", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CutlassBatchedExpertsFp8.workspace_shapes", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 } ], "properties": [], "attrs": [], "n_typable": 16, "n_typed": 16, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 10, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.cutlass_moe.run_cutlass_moe_fp8", "n_typed": 24, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 25, "n_params": 24, "n_function_overloads": 1, "n_function_params": 24 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.cutlass_moe.run_cutlass_moe_w4a8_fp8", "n_typed": 31, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 32, "n_params": 31, "n_function_overloads": 1, "n_function_params": 31 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.cutlass_moe.CutlassExpertsFp8Base", "methods": [ { "kind": "function", "name": "CutlassExpertsFp8Base.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "CutlassExpertsFp8Base._supports_current_device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CutlassExpertsFp8Base._supports_no_act_and_mul", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CutlassExpertsFp8Base._supports_quant_scheme", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CutlassExpertsFp8Base._supports_activation", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CutlassExpertsFp8Base.finalize_weight_and_reduce_impl", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CutlassExpertsFp8Base.apply", "n_typed": 15, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CutlassExpertsFp8Base.out_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CutlassExpertsFp8Base.ab_strides1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CutlassExpertsFp8Base.ab_strides2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CutlassExpertsFp8Base.c_strides1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CutlassExpertsFp8Base.c_strides2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 34, "n_typed": 27, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 22, "n_attrs": 5, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.fused_moe.cutlass_moe.FLOAT4_E2M1_MAX", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.cutlass_moe.run_cutlass_moe_fp4", "n_typed": 22, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 22, "n_params": 21, "n_function_overloads": 1, "n_function_params": 21 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.cutlass_moe.CutlassExpertsFp4", "methods": [ { "kind": "function", "name": "CutlassExpertsFp4._supports_current_device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CutlassExpertsFp4._supports_no_act_and_mul", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CutlassExpertsFp4._supports_quant_scheme", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CutlassExpertsFp4._supports_activation", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CutlassExpertsFp4._supports_parallel_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CutlassExpertsFp4.activation_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CutlassExpertsFp4.supports_expert_map", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CutlassExpertsFp4.supports_chunking", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CutlassExpertsFp4.finalize_weight_and_reduce_impl", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CutlassExpertsFp4.workspace_dtype", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CutlassExpertsFp4.workspace_shapes", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "CutlassExpertsFp4.apply", "n_typed": 15, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 } ], "properties": [ { "kind": "property", "name": "CutlassExpertsFp4.expects_unquantized_inputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [], "n_typable": 41, "n_typed": 40, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 28, "n_attrs": 0, "n_properties": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.fused_moe.cutlass_moe.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.cutlass_moe", "names": [ "vllm.model_executor.layers.fused_moe.cutlass_moe.CutlassBatchedExpertsFp8", "vllm.model_executor.layers.fused_moe.cutlass_moe.CutlassExpertsFp4", "vllm.model_executor.layers.fused_moe.cutlass_moe.CutlassExpertsFp8", "vllm.model_executor.layers.fused_moe.cutlass_moe.CutlassExpertsFp8Base", "vllm.model_executor.layers.fused_moe.cutlass_moe.CutlassExpertsW4A8Fp8", "vllm.model_executor.layers.fused_moe.cutlass_moe.FLOAT4_E2M1_MAX", "vllm.model_executor.layers.fused_moe.cutlass_moe.cutlass_moe_w4a8_fp8", "vllm.model_executor.layers.fused_moe.cutlass_moe.logger", "vllm.model_executor.layers.fused_moe.cutlass_moe.run_cutlass_moe_fp4", "vllm.model_executor.layers.fused_moe.cutlass_moe.run_cutlass_moe_fp8", "vllm.model_executor.layers.fused_moe.cutlass_moe.run_cutlass_moe_w4a8_fp8" ], "n_typable": 273, "n_typed": 249, "n_any": 0, "n_untyped": 24, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 96, "n_methods": 45, "n_method_overloads": 45, "n_method_params": 110, "n_classes": 5, "n_attrs": 17, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/router/gate_linear.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.router.gate_linear.GateLinear", "methods": [ { "kind": "function", "name": "GateLinear.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "GateLinear.set_out_dtype", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GateLinear.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GateLinear.DSV3_SUPPORTED_NUM_EXPERTS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GateLinear.DSV3_SUPPORTED_HIDDEN_SIZES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GateLinear.out_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GateLinear.allow_specialized_router_gemm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GateLinear.allow_dsv3_router_gemm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GateLinear.allow_cublas_router_gemm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 11, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.router.gate_linear", "names": [ "vllm.model_executor.layers.fused_moe.router.gate_linear.GateLinear" ], "n_typable": 16, "n_typed": 11, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_classes": 1, "n_attrs": 6, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/rocm_aiter_fused_moe.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.rocm_aiter_fused_moe.AiterExperts", "methods": [ { "kind": "function", "name": "AiterExperts.activation_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AiterExperts._supports_current_device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AiterExperts._supports_no_act_and_mul", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AiterExperts._supports_quant_scheme", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AiterExperts._supports_activation", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AiterExperts._supports_parallel_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AiterExperts.supports_expert_map", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AiterExperts.supports_chunking", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AiterExperts.finalize_weight_and_reduce_impl", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AiterExperts.workspace_shapes", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "AiterExperts.apply", "n_typed": 15, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 } ], "properties": [ { "kind": "property", "name": "AiterExperts.expects_unquantized_inputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [], "n_typable": 39, "n_typed": 36, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 27, "n_attrs": 0, "n_properties": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.rocm_aiter_fused_moe.ActivationMethod", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ActivationMethod.SILU", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ActivationMethod.GELU", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.rocm_aiter_fused_moe.QuantMethod", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "QuantMethod.NO", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "QuantMethod.PER_TENSOR", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "QuantMethod.PER_TOKEN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "QuantMethod.BLOCK_1X32", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "QuantMethod.BLOCK_1X128", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "QuantMethod.BLOCK_128x128", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 6, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.rocm_aiter_fused_moe.init_aiter_topK_meta_data", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.rocm_aiter_fused_moe.rocm_aiter_grouped_topk", "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.rocm_aiter_fused_moe.rocm_aiter_fused_experts", "n_typed": 13, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 }, { "kind": "attr", "name": "vllm.model_executor.layers.fused_moe.rocm_aiter_fused_moe.aiter_topK_meta_data", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.rocm_aiter_fused_moe", "names": [ "vllm.model_executor.layers.fused_moe.rocm_aiter_fused_moe.ActivationMethod", "vllm.model_executor.layers.fused_moe.rocm_aiter_fused_moe.AiterExperts", "vllm.model_executor.layers.fused_moe.rocm_aiter_fused_moe.QuantMethod", "vllm.model_executor.layers.fused_moe.rocm_aiter_fused_moe.aiter_topK_meta_data", "vllm.model_executor.layers.fused_moe.rocm_aiter_fused_moe.init_aiter_topK_meta_data", "vllm.model_executor.layers.fused_moe.rocm_aiter_fused_moe.rocm_aiter_fused_experts", "vllm.model_executor.layers.fused_moe.rocm_aiter_fused_moe.rocm_aiter_grouped_topk" ], "n_typable": 72, "n_typed": 68, "n_any": 0, "n_untyped": 4, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 30, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 27, "n_classes": 3, "n_attrs": 9, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/triton_deep_gemm_moe.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.triton_deep_gemm_moe.TritonOrDeepGemmExperts", "methods": [ { "kind": "function", "name": "TritonOrDeepGemmExperts.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TritonOrDeepGemmExperts.get_clses", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TritonOrDeepGemmExperts.workspace_shapes", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "TritonOrDeepGemmExperts._select_experts_impl", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 17, "n_typed": 16, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 13, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.triton_deep_gemm_moe", "names": [ "vllm.model_executor.layers.fused_moe.triton_deep_gemm_moe.TritonOrDeepGemmExperts" ], "n_typable": 17, "n_typed": 16, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 13, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/batched_deep_gemm_moe.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.batched_deep_gemm_moe.BatchedDeepGemmExperts", "methods": [ { "kind": "function", "name": "BatchedDeepGemmExperts.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BatchedDeepGemmExperts.activation_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BatchedDeepGemmExperts._supports_current_device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BatchedDeepGemmExperts._supports_no_act_and_mul", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BatchedDeepGemmExperts._supports_quant_scheme", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BatchedDeepGemmExperts._supports_activation", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BatchedDeepGemmExperts._supports_parallel_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BatchedDeepGemmExperts.supports_chunking", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BatchedDeepGemmExperts.supports_expert_map", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BatchedDeepGemmExperts.supports_packed_ue8m0_act_scales", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BatchedDeepGemmExperts.finalize_weight_and_reduce_impl", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BatchedDeepGemmExperts.workspace_shapes", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "BatchedDeepGemmExperts.estimate_expected_m", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BatchedDeepGemmExperts.apply", "n_typed": 15, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 } ], "properties": [], "attrs": [], "n_typable": 48, "n_typed": 46, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 34, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.fused_moe.batched_deep_gemm_moe.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.batched_deep_gemm_moe.scales_shape_stride_dtype", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.batched_deep_gemm_moe.persistent_masked_m_silu_mul_quant", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.batched_deep_gemm_moe", "names": [ "vllm.model_executor.layers.fused_moe.batched_deep_gemm_moe.BatchedDeepGemmExperts", "vllm.model_executor.layers.fused_moe.batched_deep_gemm_moe.logger", "vllm.model_executor.layers.fused_moe.batched_deep_gemm_moe.persistent_masked_m_silu_mul_quant", "vllm.model_executor.layers.fused_moe.batched_deep_gemm_moe.scales_shape_stride_dtype" ], "n_typable": 60, "n_typed": 56, "n_any": 0, "n_untyped": 4, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 9, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 34, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/fused_batched_moe.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.fused_batched_moe.BatchedTritonExperts", "methods": [ { "kind": "function", "name": "BatchedTritonExperts.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BatchedTritonExperts.activation_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BatchedTritonExperts._supports_current_device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BatchedTritonExperts._supports_no_act_and_mul", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BatchedTritonExperts._supports_quant_scheme", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BatchedTritonExperts._supports_activation", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BatchedTritonExperts._supports_parallel_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BatchedTritonExperts.supports_chunking", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BatchedTritonExperts.supports_expert_map", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BatchedTritonExperts.finalize_weight_and_reduce_impl", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BatchedTritonExperts.workspace_shapes", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "BatchedTritonExperts.apply", "n_typed": 15, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 } ], "properties": [], "attrs": [], "n_typable": 43, "n_typed": 41, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 31, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.fused_batched_moe.BatchedPrepareAndFinalize", "methods": [ { "kind": "function", "name": "BatchedPrepareAndFinalize.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BatchedPrepareAndFinalize.max_num_tokens_per_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BatchedPrepareAndFinalize.topk_indices_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BatchedPrepareAndFinalize.num_dispatchers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BatchedPrepareAndFinalize.output_is_reduced", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BatchedPrepareAndFinalize.prepare", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "BatchedPrepareAndFinalize.finalize", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [ { "kind": "property", "name": "BatchedPrepareAndFinalize.activation_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "BatchedPrepareAndFinalize.max_num_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BatchedPrepareAndFinalize.num_local_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BatchedPrepareAndFinalize.rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BatchedPrepareAndFinalize.num_dispatchers_", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 30, "n_typed": 25, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 18, "n_attrs": 4, "n_properties": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.fused_batched_moe.NaiveBatchedExperts", "methods": [ { "kind": "function", "name": "NaiveBatchedExperts.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "NaiveBatchedExperts.activation_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NaiveBatchedExperts._supports_current_device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NaiveBatchedExperts._supports_no_act_and_mul", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NaiveBatchedExperts._supports_quant_scheme", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NaiveBatchedExperts._supports_activation", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NaiveBatchedExperts._supports_parallel_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NaiveBatchedExperts.supports_chunking", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NaiveBatchedExperts.supports_expert_map", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NaiveBatchedExperts.finalize_weight_and_reduce_impl", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NaiveBatchedExperts.workspace_shapes", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "NaiveBatchedExperts.dequant", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NaiveBatchedExperts.apply", "n_typed": 15, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 } ], "properties": [], "attrs": [], "n_typable": 46, "n_typed": 44, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 33, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.fused_batched_moe.batched_moe_kernel_quantize_input", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.fused_batched_moe.moe_mmk", "n_typed": 17, "n_any": 0, "n_untyped": 11, "n_overloads": 1, "n_typable": 28, "n_params": 27, "n_function_overloads": 1, "n_function_params": 27 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.fused_batched_moe.batched_triton_kernel", "n_typed": 24, "n_any": 0, "n_untyped": 11, "n_overloads": 1, "n_typable": 35, "n_params": 34, "n_function_overloads": 1, "n_function_params": 34 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.fused_batched_moe.expert_triton_kernel", "n_typed": 19, "n_any": 0, "n_untyped": 14, "n_overloads": 1, "n_typable": 33, "n_params": 32, "n_function_overloads": 1, "n_function_params": 32 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.fused_batched_moe.invoke_moe_batched_triton_kernel", "n_typed": 14, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 15, "n_params": 14, "n_function_overloads": 1, "n_function_params": 14 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.fused_batched_moe", "names": [ "vllm.model_executor.layers.fused_moe.fused_batched_moe.BatchedPrepareAndFinalize", "vllm.model_executor.layers.fused_moe.fused_batched_moe.BatchedTritonExperts", "vllm.model_executor.layers.fused_moe.fused_batched_moe.NaiveBatchedExperts", "vllm.model_executor.layers.fused_moe.fused_batched_moe.batched_moe_kernel_quantize_input", "vllm.model_executor.layers.fused_moe.fused_batched_moe.batched_triton_kernel", "vllm.model_executor.layers.fused_moe.fused_batched_moe.expert_triton_kernel", "vllm.model_executor.layers.fused_moe.fused_batched_moe.invoke_moe_batched_triton_kernel", "vllm.model_executor.layers.fused_moe.fused_batched_moe.moe_mmk" ], "n_typable": 240, "n_typed": 194, "n_any": 0, "n_untyped": 46, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 116, "n_methods": 32, "n_method_overloads": 32, "n_method_params": 82, "n_classes": 3, "n_attrs": 4, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/config.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.config.RoutingMethodType", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "RoutingMethodType.Default", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RoutingMethodType.Renormalize", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RoutingMethodType.DeepSeekV3", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RoutingMethodType.Llama4", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RoutingMethodType.RenormalizeNaive", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RoutingMethodType.TopK", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RoutingMethodType.Custom", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RoutingMethodType.Simulated", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RoutingMethodType.Unspecified", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.config.FusedMoEConfig", "methods": [ { "kind": "function", "name": "FusedMoEConfig.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "FusedMoEConfig.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEConfig.dp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEConfig.pcp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEConfig.ep_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEConfig.sp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEConfig.is_sequence_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEConfig.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEConfig.dp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEConfig.pcp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEConfig.ep_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEConfig.use_ep", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEConfig.use_deepep_ht_kernels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEConfig.use_deepep_ll_kernels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEConfig.use_mori_kernels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEConfig.use_fi_all2allv_kernels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEConfig.use_naive_all2all_kernels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "FusedMoEConfig.num_experts", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoEConfig.experts_per_token", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoEConfig.hidden_dim", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoEConfig.intermediate_size_per_partition", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoEConfig.num_local_experts", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoEConfig.num_logical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoEConfig.activation", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoEConfig.device", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoEConfig.routing_method", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoEConfig.moe_parallel_config", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoEConfig.in_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoEConfig.router_logits_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoEConfig.moe_backend", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoEConfig.max_num_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoEConfig.has_bias", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoEConfig.is_act_and_mul", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoEConfig.is_lora_enabled", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoEConfig.disable_inplace", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 17, "n_typed": 0, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 18, "n_properties": 16 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.config.get_routing_method_type", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.config.awq_marlin_moe_quant_config", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.config.mxfp4_w4a16_moe_quant_config", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.config.nvfp4_moe_quant_config", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.config.fp8_w8a8_moe_quant_config", "n_typed": 14, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.config.int4_w4a16_moe_quant_config", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "attr", "name": "vllm.model_executor.layers.fused_moe.config.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.config.FusedMoEQuantDesc", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "FusedMoEQuantDesc.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoEQuantDesc.shape", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoEQuantDesc.scale", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoEQuantDesc.alpha_or_gscale", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoEQuantDesc.zp", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoEQuantDesc.bias", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 6, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.config.biased_moe_quant_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.config.ocp_mx_moe_quant_config", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.config.gptq_marlin_moe_quant_config", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.config.int8_w8a16_moe_quant_config", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.config.mxfp4_mxfp8_moe_quant_config", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.config.mxfp4_w4a8_moe_quant_config", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.config.FusedMoEParallelConfig", "methods": [ { "kind": "function", "name": "FusedMoEParallelConfig.flatten_tp_across_dp_and_pcp", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "FusedMoEParallelConfig.make", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "FusedMoEParallelConfig.make_no_parallel", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "FusedMoEParallelConfig.is_sequence_parallel", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEParallelConfig.use_all2all_kernels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEParallelConfig.use_deepep_ht_kernels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEParallelConfig.use_deepep_ll_kernels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEParallelConfig.use_fi_all2allv_kernels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEParallelConfig.use_batched_activation_format", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEParallelConfig.use_naive_all2all_kernels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEParallelConfig.use_mori_kernels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "FusedMoEParallelConfig.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoEParallelConfig.pcp_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoEParallelConfig.dp_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoEParallelConfig.ep_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoEParallelConfig.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoEParallelConfig.pcp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoEParallelConfig.dp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoEParallelConfig.ep_rank", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoEParallelConfig.sp_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoEParallelConfig.use_ep", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoEParallelConfig.all2all_backend", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoEParallelConfig.enable_eplb", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 21, "n_typed": 14, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 10, "n_attrs": 12, "n_properties": 8 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.config.int4_w4afp8_moe_quant_config", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.config.nvfp4_w4a16_moe_quant_config", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.config.int8_w8a8_moe_quant_config", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "attr", "name": "vllm.model_executor.layers.fused_moe.config.FUSED_MOE_UNQUANTIZED_CONFIG", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.config.FusedMoEQuantConfig", "methods": [ { "kind": "function", "name": "FusedMoEQuantConfig.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FusedMoEQuantConfig.config_name", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FusedMoEQuantConfig.scale_shape", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FusedMoEQuantConfig.batched_scale_shape", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "FusedMoEQuantConfig.make", "n_typed": 19, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 19, "n_params": 18, "n_function_overloads": 1, "n_function_params": 18 } ], "properties": [ { "kind": "property", "name": "FusedMoEQuantConfig.quant_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEQuantConfig.weight_quant_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEQuantConfig.is_quantized", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEQuantConfig.is_per_act_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEQuantConfig.per_act_token_quant", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEQuantConfig.per_out_ch_quant", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEQuantConfig.is_per_tensor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEQuantConfig.block_shape", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEQuantConfig.is_block_quantized", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEQuantConfig.a1_scale", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEQuantConfig.a1_gscale", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEQuantConfig.a2_scale", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEQuantConfig.a2_gscale", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEQuantConfig.w1_scale", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEQuantConfig.w1_zp", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEQuantConfig.w1_bias", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEQuantConfig.w1_precision", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEQuantConfig.g1_alphas", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEQuantConfig.w2_scale", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEQuantConfig.w2_zp", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEQuantConfig.w2_bias", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEQuantConfig.w2_precision", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEQuantConfig.g2_alphas", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEQuantConfig.use_fp8_w8a8", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEQuantConfig.use_int8_w8a8", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEQuantConfig.use_int8_w8a16", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEQuantConfig.use_fp8_w8a16", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEQuantConfig.use_int4_w4a16", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEQuantConfig.use_nvfp4_w4a16", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEQuantConfig.ocp_mx_scheme", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEQuantConfig.use_mxfp4_w4a16", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEQuantConfig.use_mxfp4_w4a4", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEQuantConfig.use_nvfp4_w4a4", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEQuantConfig.use_mxfp4_w4a8", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "FusedMoEQuantConfig._a1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoEQuantConfig._a2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoEQuantConfig._w1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoEQuantConfig._w2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedMoEQuantConfig.is_nvfp4_scale_swizzled", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 63, "n_typed": 62, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 24, "n_attrs": 5, "n_properties": 34 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.config.fp8_w8a16_moe_quant_config", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.config", "names": [ "vllm.model_executor.layers.fused_moe.config.FUSED_MOE_UNQUANTIZED_CONFIG", "vllm.model_executor.layers.fused_moe.config.FusedMoEConfig", "vllm.model_executor.layers.fused_moe.config.FusedMoEParallelConfig", "vllm.model_executor.layers.fused_moe.config.FusedMoEQuantConfig", "vllm.model_executor.layers.fused_moe.config.FusedMoEQuantDesc", "vllm.model_executor.layers.fused_moe.config.RoutingMethodType", "vllm.model_executor.layers.fused_moe.config.awq_marlin_moe_quant_config", "vllm.model_executor.layers.fused_moe.config.biased_moe_quant_config", "vllm.model_executor.layers.fused_moe.config.fp8_w8a16_moe_quant_config", "vllm.model_executor.layers.fused_moe.config.fp8_w8a8_moe_quant_config", "vllm.model_executor.layers.fused_moe.config.get_routing_method_type", "vllm.model_executor.layers.fused_moe.config.gptq_marlin_moe_quant_config", "vllm.model_executor.layers.fused_moe.config.int4_w4a16_moe_quant_config", "vllm.model_executor.layers.fused_moe.config.int4_w4afp8_moe_quant_config", "vllm.model_executor.layers.fused_moe.config.int8_w8a16_moe_quant_config", "vllm.model_executor.layers.fused_moe.config.int8_w8a8_moe_quant_config", "vllm.model_executor.layers.fused_moe.config.logger", "vllm.model_executor.layers.fused_moe.config.mxfp4_mxfp8_moe_quant_config", "vllm.model_executor.layers.fused_moe.config.mxfp4_w4a16_moe_quant_config", "vllm.model_executor.layers.fused_moe.config.mxfp4_w4a8_moe_quant_config", "vllm.model_executor.layers.fused_moe.config.nvfp4_moe_quant_config", "vllm.model_executor.layers.fused_moe.config.nvfp4_w4a16_moe_quant_config", "vllm.model_executor.layers.fused_moe.config.ocp_mx_moe_quant_config" ], "n_typable": 222, "n_typed": 195, "n_any": 0, "n_untyped": 27, "n_functions": 16, "n_function_overloads": 16, "n_function_params": 103, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 34, "n_classes": 5, "n_attrs": 52, "n_properties": 58, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/zero_expert_fused_moe.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.zero_expert_fused_moe.ZeroExpertFusedMoE", "methods": [ { "kind": "function", "name": "ZeroExpertFusedMoE.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ZeroExpertFusedMoE._temporarily_set_attrs", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ZeroExpertFusedMoE._compute_zero_expert_result", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ZeroExpertFusedMoE.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ZeroExpertFusedMoE.zero_expert_num", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ZeroExpertFusedMoE.zero_expert_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ZeroExpertFusedMoE.custom_routing_function", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 10, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 10, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.zero_expert_fused_moe", "names": [ "vllm.model_executor.layers.fused_moe.zero_expert_fused_moe.ZeroExpertFusedMoE" ], "n_typable": 17, "n_typed": 10, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 10, "n_classes": 1, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/deep_gemm_moe.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.deep_gemm_moe.DeepGemmExperts", "methods": [ { "kind": "function", "name": "DeepGemmExperts.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeepGemmExperts.activation_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeepGemmExperts._supports_current_device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeepGemmExperts._supports_no_act_and_mul", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeepGemmExperts._supports_quant_scheme", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeepGemmExperts._supports_activation", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepGemmExperts._supports_parallel_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepGemmExperts.supports_chunking", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeepGemmExperts.supports_expert_map", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeepGemmExperts.finalize_weight_and_reduce_impl", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeepGemmExperts.workspace_shapes", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "DeepGemmExperts._act_mul_quant", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DeepGemmExperts.apply", "n_typed": 15, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 } ], "properties": [], "attrs": [], "n_typable": 45, "n_typed": 43, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 32, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.fused_moe.deep_gemm_moe.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.deep_gemm_moe", "names": [ "vllm.model_executor.layers.fused_moe.deep_gemm_moe.DeepGemmExperts", "vllm.model_executor.layers.fused_moe.deep_gemm_moe.logger" ], "n_typable": 46, "n_typed": 43, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 32, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/router/fused_moe_router.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.router.fused_moe_router.FusedMoERouter", "methods": [ { "kind": "function", "name": "FusedMoERouter.select_experts", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [ { "kind": "property", "name": "FusedMoERouter.routing_method_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.router.fused_moe_router", "names": [ "vllm.model_executor.layers.fused_moe.router.fused_moe_router.FusedMoERouter" ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_classes": 1, "n_attrs": 0, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/unquantized_fused_moe_method.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.unquantized_fused_moe_method.UnquantizedFusedMoEMethod", "methods": [ { "kind": "function", "name": "UnquantizedFusedMoEMethod.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "UnquantizedFusedMoEMethod._select_monolithic", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "UnquantizedFusedMoEMethod.forward_native", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "UnquantizedFusedMoEMethod.maybe_make_prepare_finalize", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "UnquantizedFusedMoEMethod.select_gemm_impl", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "UnquantizedFusedMoEMethod.create_weights", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "UnquantizedFusedMoEMethod._maybe_pad_weight", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "UnquantizedFusedMoEMethod._setup_kernel", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "UnquantizedFusedMoEMethod.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "UnquantizedFusedMoEMethod.apply", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "UnquantizedFusedMoEMethod.get_fused_moe_quant_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "UnquantizedFusedMoEMethod.forward_cuda", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "UnquantizedFusedMoEMethod.forward_monolithic_cuda", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "UnquantizedFusedMoEMethod.forward_monolithic_cpu", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [ { "kind": "property", "name": "UnquantizedFusedMoEMethod.is_monolithic", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "UnquantizedFusedMoEMethod.supports_eplb", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "UnquantizedFusedMoEMethod.unquantized_backend", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UnquantizedFusedMoEMethod.rocm_aiter_moe_enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UnquantizedFusedMoEMethod.kernel", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "UnquantizedFusedMoEMethod.apply_monolithic", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 57, "n_typed": 52, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 37, "n_attrs": 4, "n_properties": 2 }, { "kind": "attr", "name": "vllm.model_executor.layers.fused_moe.unquantized_fused_moe_method.TritonExperts", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.fused_moe.unquantized_fused_moe_method.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [ { "kind": "type", "rules": null } ], "name": "vllm.model_executor.layers.fused_moe.unquantized_fused_moe_method", "names": [ "vllm.model_executor.layers.fused_moe.unquantized_fused_moe_method.TritonExperts", "vllm.model_executor.layers.fused_moe.unquantized_fused_moe_method.UnquantizedFusedMoEMethod", "vllm.model_executor.layers.fused_moe.unquantized_fused_moe_method.logger" ], "n_typable": 58, "n_typed": 52, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 37, "n_classes": 1, "n_attrs": 6, "n_properties": 2, "n_type_ignores": 1 }, { "path": "vllm/model_executor/layers/fused_moe/fused_moe_method_base.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.fused_moe_method_base.FusedMoEMethodBase", "methods": [ { "kind": "function", "name": "FusedMoEMethodBase.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FusedMoEMethodBase.create_weights", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "FusedMoEMethodBase.uses_weight_scale_2_pattern", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FusedMoEMethodBase.maybe_make_prepare_finalize", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FusedMoEMethodBase.select_gemm_impl", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FusedMoEMethodBase.get_fused_moe_quant_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FusedMoEMethodBase.apply", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "FusedMoEMethodBase.apply_monolithic", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [ { "kind": "property", "name": "FusedMoEMethodBase.supports_internal_mk", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEMethodBase.mk_owns_shared_expert", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEMethodBase.topk_indices_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEMethodBase.supports_eplb", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEMethodBase.method_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEMethodBase.is_monolithic", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "FusedMoEMethodBase.moe", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoEMethodBase.moe_quant_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoEMethodBase.moe_kernel", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 36, "n_typed": 33, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 19, "n_attrs": 3, "n_properties": 6 }, { "kind": "attr", "name": "vllm.model_executor.layers.fused_moe.fused_moe_method_base.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.fused_moe_method_base", "names": [ "vllm.model_executor.layers.fused_moe.fused_moe_method_base.FusedMoEMethodBase", "vllm.model_executor.layers.fused_moe.fused_moe_method_base.logger" ], "n_typable": 37, "n_typed": 33, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 19, "n_classes": 1, "n_attrs": 4, "n_properties": 6, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/all2all_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.all2all_utils.maybe_roundup_layer_hidden_size", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.model_executor.layers.fused_moe.all2all_utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.all2all_utils.maybe_make_prepare_finalize", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.all2all_utils", "names": [ "vllm.model_executor.layers.fused_moe.all2all_utils.logger", "vllm.model_executor.layers.fused_moe.all2all_utils.maybe_make_prepare_finalize", "vllm.model_executor.layers.fused_moe.all2all_utils.maybe_roundup_layer_hidden_size" ], "n_typable": 11, "n_typed": 10, "n_any": 0, "n_untyped": 1, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 8, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/cpu_fused_moe.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.cpu_fused_moe.select_experts", "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.cpu_fused_moe.CPUFusedMOE", "methods": [ { "kind": "function", "name": "CPUFusedMOE.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CPUFusedMOE.__call__", "n_typed": 17, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 17, "n_params": 16, "n_function_overloads": 1, "n_function_params": 16 }, { "kind": "function", "name": "CPUFusedMOE.check_grouped_gemm", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CPUFusedMOE.init_moe_grouped_gemm", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CPUFusedMOE.init_moe_torch", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CPUFusedMOE.forward_grouped_gemm", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "CPUFusedMOE.forward_torch", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CPUFusedMOE.isa", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CPUFusedMOE.forward_method", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 43, "n_typed": 41, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 34, "n_attrs": 2, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.cpu_fused_moe.grouped_topk", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.cpu_fused_moe.cpu_fused_moe_torch", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.cpu_fused_moe.SGLFusedMOE", "methods": [ { "kind": "function", "name": "SGLFusedMOE.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SGLFusedMOE.__call__", "n_typed": 17, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 17, "n_params": 16, "n_function_overloads": 1, "n_function_params": 16 } ], "properties": [], "attrs": [], "n_typable": 19, "n_typed": 19, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 17, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.cpu_fused_moe", "names": [ "vllm.model_executor.layers.fused_moe.cpu_fused_moe.CPUFusedMOE", "vllm.model_executor.layers.fused_moe.cpu_fused_moe.SGLFusedMOE", "vllm.model_executor.layers.fused_moe.cpu_fused_moe.cpu_fused_moe_torch", "vllm.model_executor.layers.fused_moe.cpu_fused_moe.grouped_topk", "vllm.model_executor.layers.fused_moe.cpu_fused_moe.select_experts" ], "n_typable": 93, "n_typed": 91, "n_any": 0, "n_untyped": 2, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 28, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 51, "n_classes": 2, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/deep_gemm_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.deep_gemm_utils.apply_expert_map", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.deep_gemm_utils.ep_gather", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.deep_gemm_utils.expert_num_tokens_round_up_and_sum", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.deep_gemm_utils.ep_scatter", "n_typed": 10, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.deep_gemm_utils.deepgemm_moe_permute", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.deep_gemm_utils.compute_aligned_M", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.deep_gemm_utils.round_up_128", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.deep_gemm_utils.deepgemm_unpermute_and_reduce", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.deep_gemm_utils", "names": [ "vllm.model_executor.layers.fused_moe.deep_gemm_utils.apply_expert_map", "vllm.model_executor.layers.fused_moe.deep_gemm_utils.compute_aligned_M", "vllm.model_executor.layers.fused_moe.deep_gemm_utils.deepgemm_moe_permute", "vllm.model_executor.layers.fused_moe.deep_gemm_utils.deepgemm_unpermute_and_reduce", "vllm.model_executor.layers.fused_moe.deep_gemm_utils.ep_gather", "vllm.model_executor.layers.fused_moe.deep_gemm_utils.ep_scatter", "vllm.model_executor.layers.fused_moe.deep_gemm_utils.expert_num_tokens_round_up_and_sum", "vllm.model_executor.layers.fused_moe.deep_gemm_utils.round_up_128" ], "n_typable": 47, "n_typed": 39, "n_any": 0, "n_untyped": 8, "n_functions": 8, "n_function_overloads": 8, "n_function_params": 39, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/deepep_ht_prepare_finalize.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.deepep_ht_prepare_finalize.DeepEPHTPrepareAndFinalize", "methods": [ { "kind": "function", "name": "DeepEPHTPrepareAndFinalize.maybe_roundup_layer_hidden_size", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeepEPHTPrepareAndFinalize.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "DeepEPHTPrepareAndFinalize.num_dispatchers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeepEPHTPrepareAndFinalize.output_is_reduced", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeepEPHTPrepareAndFinalize.max_num_tokens_per_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeepEPHTPrepareAndFinalize.topk_indices_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeepEPHTPrepareAndFinalize._get_dispatch_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeepEPHTPrepareAndFinalize._get_combine_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeepEPHTPrepareAndFinalize._do_dispatch", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "DeepEPHTPrepareAndFinalize._receiver", "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "DeepEPHTPrepareAndFinalize.supports_async", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeepEPHTPrepareAndFinalize.prepare_async", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "DeepEPHTPrepareAndFinalize.prepare", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "DeepEPHTPrepareAndFinalize._finalize", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "DeepEPHTPrepareAndFinalize.finalize_async", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "DeepEPHTPrepareAndFinalize.finalize", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [ { "kind": "property", "name": "DeepEPHTPrepareAndFinalize.activation_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "DeepEPHTPrepareAndFinalize.buffer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepEPHTPrepareAndFinalize.num_dispatchers_", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepEPHTPrepareAndFinalize.dp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepEPHTPrepareAndFinalize.rank_expert_offset", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepEPHTPrepareAndFinalize.async_prepare", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepEPHTPrepareAndFinalize.handles", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepEPHTPrepareAndFinalize.available_rank_configs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 83, "n_typed": 75, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 16, "n_method_overloads": 16, "n_method_params": 59, "n_attrs": 7, "n_properties": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.deepep_ht_prepare_finalize", "names": [ "vllm.model_executor.layers.fused_moe.deepep_ht_prepare_finalize.DeepEPHTPrepareAndFinalize" ], "n_typable": 83, "n_typed": 75, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 16, "n_method_overloads": 16, "n_method_params": 59, "n_classes": 1, "n_attrs": 7, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/deepep_ll_prepare_finalize.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.deepep_ll_prepare_finalize.DeepEPLLPrepareAndFinalize", "methods": [ { "kind": "function", "name": "DeepEPLLPrepareAndFinalize.maybe_roundup_layer_hidden_size", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepEPLLPrepareAndFinalize.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "DeepEPLLPrepareAndFinalize.post_init_setup", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepEPLLPrepareAndFinalize.num_dispatchers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeepEPLLPrepareAndFinalize.output_is_reduced", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeepEPLLPrepareAndFinalize.max_num_tokens_per_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeepEPLLPrepareAndFinalize.topk_indices_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeepEPLLPrepareAndFinalize._map_global_to_physical_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepEPLLPrepareAndFinalize._map_local_to_global_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepEPLLPrepareAndFinalize._do_quant", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DeepEPLLPrepareAndFinalize.supports_async", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeepEPLLPrepareAndFinalize.prepare_async", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "DeepEPLLPrepareAndFinalize._receiver", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "DeepEPLLPrepareAndFinalize.prepare", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "DeepEPLLPrepareAndFinalize._finalize", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "DeepEPLLPrepareAndFinalize.finalize_async", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "DeepEPLLPrepareAndFinalize.finalize", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [ { "kind": "property", "name": "DeepEPLLPrepareAndFinalize.activation_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "DeepEPLLPrepareAndFinalize.SUPPORTED_HIDDEN_SIZES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeepEPLLPrepareAndFinalize.buffer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepEPLLPrepareAndFinalize.max_tokens_per_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepEPLLPrepareAndFinalize.use_fp8_dispatch", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepEPLLPrepareAndFinalize.handles", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepEPLLPrepareAndFinalize.num_dispatchers_", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepEPLLPrepareAndFinalize.global_to_physical", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepEPLLPrepareAndFinalize.physical_to_global", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepEPLLPrepareAndFinalize.local_expert_global_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepEPLLPrepareAndFinalize.use_ue8m0_dispatch", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 81, "n_typed": 71, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 17, "n_method_overloads": 17, "n_method_params": 54, "n_attrs": 10, "n_properties": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.deepep_ll_prepare_finalize.dequant_fp8", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.model_executor.layers.fused_moe.deepep_ll_prepare_finalize.DEEPEP_QUANT_BLOCK_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.fused_moe.deepep_ll_prepare_finalize.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.fused_moe.deepep_ll_prepare_finalize.DEEPEP_QUANT_BLOCK_SHAPE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.deepep_ll_prepare_finalize", "names": [ "vllm.model_executor.layers.fused_moe.deepep_ll_prepare_finalize.DEEPEP_QUANT_BLOCK_SHAPE", "vllm.model_executor.layers.fused_moe.deepep_ll_prepare_finalize.DEEPEP_QUANT_BLOCK_SIZE", "vllm.model_executor.layers.fused_moe.deepep_ll_prepare_finalize.DeepEPLLPrepareAndFinalize", "vllm.model_executor.layers.fused_moe.deepep_ll_prepare_finalize.dequant_fp8", "vllm.model_executor.layers.fused_moe.deepep_ll_prepare_finalize.logger" ], "n_typable": 85, "n_typed": 74, "n_any": 0, "n_untyped": 11, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 17, "n_method_overloads": 17, "n_method_params": 54, "n_classes": 1, "n_attrs": 13, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/experts/trtllm_fp8_moe.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.experts.trtllm_fp8_moe.TrtLlmFp8Experts", "methods": [ { "kind": "function", "name": "TrtLlmFp8Experts.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TrtLlmFp8Experts.activation_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TrtLlmFp8Experts._supports_current_device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TrtLlmFp8Experts._supports_no_act_and_mul", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TrtLlmFp8Experts._supports_quant_scheme", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TrtLlmFp8Experts._supports_activation", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TrtLlmFp8Experts._supports_routing_method", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "TrtLlmFp8Experts._supports_parallel_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TrtLlmFp8Experts._supports_router_logits_dtype", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TrtLlmFp8Experts.supports_chunking", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TrtLlmFp8Experts.supports_expert_map", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TrtLlmFp8Experts._apply_per_block", "n_typed": 14, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 }, { "kind": "function", "name": "TrtLlmFp8Experts._apply_per_tensor", "n_typed": 14, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 }, { "kind": "function", "name": "TrtLlmFp8Experts.apply", "n_typed": 14, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TrtLlmFp8Experts.routing_method_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TrtLlmFp8Experts.topk", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TrtLlmFp8Experts.intermediate_size_per_partition", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TrtLlmFp8Experts.hidden_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TrtLlmFp8Experts.local_num_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TrtLlmFp8Experts.ep_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 70, "n_typed": 63, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 50, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.experts.trtllm_fp8_moe", "names": [ "vllm.model_executor.layers.fused_moe.experts.trtllm_fp8_moe.TrtLlmFp8Experts" ], "n_typable": 70, "n_typed": 63, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 50, "n_classes": 1, "n_attrs": 6, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/experts/trtllm_nvfp4_moe.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.experts.trtllm_nvfp4_moe.TrtLlmNvFp4ExpertsModular", "methods": [ { "kind": "function", "name": "TrtLlmNvFp4ExpertsModular._supports_parallel_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TrtLlmNvFp4ExpertsModular.workspace_shapes", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "TrtLlmNvFp4ExpertsModular.finalize_weight_and_reduce_impl", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TrtLlmNvFp4ExpertsModular.apply", "n_typed": 15, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 } ], "properties": [], "attrs": [], "n_typable": 28, "n_typed": 27, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 24, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.experts.trtllm_nvfp4_moe.TrtLlmNvFp4ExpertsMonolithic", "methods": [ { "kind": "function", "name": "TrtLlmNvFp4ExpertsMonolithic._supports_parallel_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TrtLlmNvFp4ExpertsMonolithic._supports_routing_method", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "TrtLlmNvFp4ExpertsMonolithic._supports_router_logits_dtype", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TrtLlmNvFp4ExpertsMonolithic.apply", "n_typed": 14, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 } ], "properties": [], "attrs": [], "n_typable": 23, "n_typed": 23, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 19, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.experts.trtllm_nvfp4_moe.TrtLlmNvFp4ExpertsBase", "methods": [ { "kind": "function", "name": "TrtLlmNvFp4ExpertsBase.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TrtLlmNvFp4ExpertsBase._supports_current_device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TrtLlmNvFp4ExpertsBase._supports_no_act_and_mul", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TrtLlmNvFp4ExpertsBase._supports_quant_scheme", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TrtLlmNvFp4ExpertsBase._supports_activation", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TrtLlmNvFp4ExpertsBase._supports_shape", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TrtLlmNvFp4ExpertsBase.activation_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TrtLlmNvFp4ExpertsBase.supports_chunking", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TrtLlmNvFp4ExpertsBase.supports_expert_map", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TrtLlmNvFp4ExpertsBase.moe_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TrtLlmNvFp4ExpertsBase.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TrtLlmNvFp4ExpertsBase.routing_method_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TrtLlmNvFp4ExpertsBase.topk", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TrtLlmNvFp4ExpertsBase.intermediate_size_per_partition", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TrtLlmNvFp4ExpertsBase.hidden_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TrtLlmNvFp4ExpertsBase.local_num_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TrtLlmNvFp4ExpertsBase.ep_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TrtLlmNvFp4ExpertsBase.g1_scale_c", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 24, "n_typed": 14, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 6, "n_attrs": 9, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.experts.trtllm_nvfp4_moe", "names": [ "vllm.model_executor.layers.fused_moe.experts.trtllm_nvfp4_moe.TrtLlmNvFp4ExpertsBase", "vllm.model_executor.layers.fused_moe.experts.trtllm_nvfp4_moe.TrtLlmNvFp4ExpertsModular", "vllm.model_executor.layers.fused_moe.experts.trtllm_nvfp4_moe.TrtLlmNvFp4ExpertsMonolithic" ], "n_typable": 75, "n_typed": 64, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 17, "n_method_overloads": 17, "n_method_params": 49, "n_classes": 3, "n_attrs": 9, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/fallback.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.fallback.FallbackExperts", "methods": [ { "kind": "function", "name": "FallbackExperts.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FallbackExperts.get_clses", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FallbackExperts.activation_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FallbackExperts._supports_current_device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FallbackExperts._supports_no_act_and_mul", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FallbackExperts._supports_quant_scheme", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FallbackExperts._supports_activation", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FallbackExperts._supports_parallel_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FallbackExperts.supports_chunking", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FallbackExperts.supports_expert_map", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FallbackExperts.finalize_weight_and_reduce_impl", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FallbackExperts.workspace_shapes", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "FallbackExperts._select_experts_impl", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "FallbackExperts.apply", "n_typed": 15, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FallbackExperts.fallback_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FallbackExperts.experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 48, "n_typed": 44, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 32, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.fallback", "names": [ "vllm.model_executor.layers.fused_moe.fallback.FallbackExperts" ], "n_typable": 48, "n_typed": 44, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 32, "n_classes": 1, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/flashinfer_a2a_prepare_finalize.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.flashinfer_a2a_prepare_finalize.get_local_sizes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.flashinfer_a2a_prepare_finalize.flashinfer_alltoall_dispatch", "n_typed": 10, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.flashinfer_a2a_prepare_finalize.FlashInferA2APrepareAndFinalize", "methods": [ { "kind": "function", "name": "FlashInferA2APrepareAndFinalize.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlashInferA2APrepareAndFinalize.max_num_tokens_per_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashInferA2APrepareAndFinalize.topk_indices_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashInferA2APrepareAndFinalize.num_dispatchers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashInferA2APrepareAndFinalize.output_is_reduced", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashInferA2APrepareAndFinalize._apply_router_weight_on_input", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FlashInferA2APrepareAndFinalize.prepare", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "FlashInferA2APrepareAndFinalize.finalize", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [ { "kind": "property", "name": "FlashInferA2APrepareAndFinalize.activation_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "FlashInferA2APrepareAndFinalize.num_dispatchers_", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferA2APrepareAndFinalize.all2all_manager", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 30, "n_typed": 27, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 19, "n_attrs": 2, "n_properties": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.flashinfer_a2a_prepare_finalize.flashinfer_alltoall_combine", "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.flashinfer_a2a_prepare_finalize", "names": [ "vllm.model_executor.layers.fused_moe.flashinfer_a2a_prepare_finalize.FlashInferA2APrepareAndFinalize", "vllm.model_executor.layers.fused_moe.flashinfer_a2a_prepare_finalize.flashinfer_alltoall_combine", "vllm.model_executor.layers.fused_moe.flashinfer_a2a_prepare_finalize.flashinfer_alltoall_dispatch", "vllm.model_executor.layers.fused_moe.flashinfer_a2a_prepare_finalize.get_local_sizes" ], "n_typable": 48, "n_typed": 41, "n_any": 0, "n_untyped": 7, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 15, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 19, "n_classes": 1, "n_attrs": 2, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/flashinfer_cutedsl_moe.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.flashinfer_cutedsl_moe.flashinfer_cutedsl_moe_masked", "n_typed": 10, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 }, { "kind": "attr", "name": "vllm.model_executor.layers.fused_moe.flashinfer_cutedsl_moe.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.flashinfer_cutedsl_moe.get_cute_dtype", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.flashinfer_cutedsl_moe.FlashInferCuteDSLExperts", "methods": [ { "kind": "function", "name": "FlashInferCuteDSLExperts.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FlashInferCuteDSLExperts.activation_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashInferCuteDSLExperts._supports_current_device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashInferCuteDSLExperts._supports_no_act_and_mul", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashInferCuteDSLExperts._supports_quant_scheme", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FlashInferCuteDSLExperts._supports_activation", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlashInferCuteDSLExperts._supports_parallel_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlashInferCuteDSLExperts.supports_expert_map", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashInferCuteDSLExperts.supports_chunking", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashInferCuteDSLExperts.finalize_weight_and_reduce_impl", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashInferCuteDSLExperts.workspace_shapes", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "FlashInferCuteDSLExperts.apply", "n_typed": 15, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashInferCuteDSLExperts.out_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 44, "n_typed": 41, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 31, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.flashinfer_cutedsl_moe", "names": [ "vllm.model_executor.layers.fused_moe.flashinfer_cutedsl_moe.FlashInferCuteDSLExperts", "vllm.model_executor.layers.fused_moe.flashinfer_cutedsl_moe.flashinfer_cutedsl_moe_masked", "vllm.model_executor.layers.fused_moe.flashinfer_cutedsl_moe.get_cute_dtype", "vllm.model_executor.layers.fused_moe.flashinfer_cutedsl_moe.logger" ], "n_typable": 60, "n_typed": 53, "n_any": 0, "n_untyped": 7, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 13, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 31, "n_classes": 1, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/flashinfer_cutlass_moe.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.layers.fused_moe.flashinfer_cutlass_moe.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.flashinfer_cutlass_moe.is_valid_flashinfer_cutlass_fused_moe", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.flashinfer_cutlass_moe.FlashInferExperts", "methods": [ { "kind": "function", "name": "FlashInferExperts.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FlashInferExperts._supports_current_device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashInferExperts._supports_no_act_and_mul", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashInferExperts._supports_quant_scheme", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FlashInferExperts._supports_activation", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlashInferExperts._supports_parallel_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlashInferExperts.activation_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashInferExperts.supports_expert_map", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashInferExperts.supports_chunking", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashInferExperts.finalize_weight_and_reduce_impl", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashInferExperts.workspace_shapes", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "FlashInferExperts.apply", "n_typed": 15, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 }, { "kind": "function", "name": "FlashInferExperts.moe_sum", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [ { "kind": "property", "name": "FlashInferExperts.expects_unquantized_inputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "FlashInferExperts.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferExperts.num_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferExperts.ep_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferExperts.ep_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferExperts.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferExperts.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferExperts.out_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferExperts.use_dp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferExperts.use_deepseek_fp8_block_scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferExperts.max_capture_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferExperts.gemm1_alpha", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferExperts.gemm1_beta", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferExperts.gemm1_clamp_limit", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferExperts.fake_input_scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 59, "n_typed": 43, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 31, "n_attrs": 14, "n_properties": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.flashinfer_cutlass_moe", "names": [ "vllm.model_executor.layers.fused_moe.flashinfer_cutlass_moe.FlashInferExperts", "vllm.model_executor.layers.fused_moe.flashinfer_cutlass_moe.is_valid_flashinfer_cutlass_fused_moe", "vllm.model_executor.layers.fused_moe.flashinfer_cutlass_moe.logger" ], "n_typable": 64, "n_typed": 47, "n_any": 0, "n_untyped": 17, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 3, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 31, "n_classes": 1, "n_attrs": 15, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/flashinfer_trtllm_moe.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.flashinfer_trtllm_moe.flashinfer_fused_moe_bf16_fake", "n_typed": 15, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 15, "n_params": 14, "n_function_overloads": 1, "n_function_params": 14 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.flashinfer_trtllm_moe.is_supported_config_trtllm_bf16", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.flashinfer_trtllm_moe.flashinfer_fused_moe_bf16", "n_typed": 15, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 15, "n_params": 14, "n_function_overloads": 1, "n_function_params": 14 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.flashinfer_trtllm_moe", "names": [ "vllm.model_executor.layers.fused_moe.flashinfer_trtllm_moe.flashinfer_fused_moe_bf16", "vllm.model_executor.layers.fused_moe.flashinfer_trtllm_moe.flashinfer_fused_moe_bf16_fake", "vllm.model_executor.layers.fused_moe.flashinfer_trtllm_moe.is_supported_config_trtllm_bf16" ], "n_typable": 33, "n_typed": 33, "n_any": 0, "n_untyped": 0, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 30, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/fused_marlin_moe.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.fused_marlin_moe.fused_marlin_moe", "n_typed": 34, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 34, "n_params": 33, "n_function_overloads": 1, "n_function_params": 33 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.fused_marlin_moe.MarlinExpertsBase", "methods": [ { "kind": "function", "name": "MarlinExpertsBase.__init__", "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "MarlinExpertsBase._supports_current_device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MarlinExpertsBase._supports_no_act_and_mul", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MarlinExpertsBase._supports_quant_scheme", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MarlinExpertsBase._supports_activation", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MarlinExpertsBase._supports_parallel_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MarlinExpertsBase.moe_problem_size", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [ { "kind": "property", "name": "MarlinExpertsBase.quant_type_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "MarlinExpertsBase.w13_g_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MarlinExpertsBase.w2_g_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MarlinExpertsBase.w13_g_idx_sort_indices", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MarlinExpertsBase.w2_g_idx_sort_indices", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MarlinExpertsBase.is_k_full", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MarlinExpertsBase.input_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 31, "n_typed": 24, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 17, "n_attrs": 6, "n_properties": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.fused_marlin_moe.BatchedMarlinExperts", "methods": [ { "kind": "function", "name": "BatchedMarlinExperts.__init__", "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "BatchedMarlinExperts.supports_expert_map", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BatchedMarlinExperts.finalize_weight_and_reduce_impl", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BatchedMarlinExperts.activation_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BatchedMarlinExperts.supports_chunking", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BatchedMarlinExperts.workspace_shapes", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "BatchedMarlinExperts.apply", "n_typed": 15, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 } ], "properties": [], "attrs": [], "n_typable": 39, "n_typed": 37, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 32, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.fused_marlin_moe.batched_fused_marlin_moe", "n_typed": 28, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 28, "n_params": 27, "n_function_overloads": 1, "n_function_params": 27 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.fused_marlin_moe.MarlinExperts", "methods": [ { "kind": "function", "name": "MarlinExperts.supports_expert_map", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MarlinExperts.finalize_weight_and_reduce_impl", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MarlinExperts.activation_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MarlinExperts.supports_chunking", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MarlinExperts.workspace_shapes", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "MarlinExperts.apply", "n_typed": 15, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 }, { "kind": "function", "name": "MarlinExperts.moe_sum", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 32, "n_typed": 31, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 25, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.fused_marlin_moe", "names": [ "vllm.model_executor.layers.fused_moe.fused_marlin_moe.BatchedMarlinExperts", "vllm.model_executor.layers.fused_moe.fused_marlin_moe.MarlinExperts", "vllm.model_executor.layers.fused_moe.fused_marlin_moe.MarlinExpertsBase", "vllm.model_executor.layers.fused_moe.fused_marlin_moe.batched_fused_marlin_moe", "vllm.model_executor.layers.fused_moe.fused_marlin_moe.fused_marlin_moe" ], "n_typable": 164, "n_typed": 154, "n_any": 0, "n_untyped": 10, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 60, "n_methods": 21, "n_method_overloads": 21, "n_method_params": 74, "n_classes": 3, "n_attrs": 6, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/fused_moe_modular_method.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.fused_moe_modular_method.FusedMoEModularMethod", "methods": [ { "kind": "function", "name": "FusedMoEModularMethod.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FusedMoEModularMethod.make", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "FusedMoEModularMethod.create_weights", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "FusedMoEModularMethod.get_fused_moe_quant_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FusedMoEModularMethod.apply", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [ { "kind": "property", "name": "FusedMoEModularMethod.supports_eplb", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FusedMoEModularMethod.method_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "FusedMoEModularMethod.moe_quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoEModularMethod.moe_kernel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoEModularMethod.disable_expert_map", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoEModularMethod.old_quant_method", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 30, "n_typed": 23, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 19, "n_attrs": 4, "n_properties": 2 }, { "kind": "attr", "name": "vllm.model_executor.layers.fused_moe.fused_moe_modular_method.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.fused_moe_modular_method", "names": [ "vllm.model_executor.layers.fused_moe.fused_moe_modular_method.FusedMoEModularMethod", "vllm.model_executor.layers.fused_moe.fused_moe_modular_method.logger" ], "n_typable": 31, "n_typed": 23, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 19, "n_classes": 1, "n_attrs": 5, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/gpt_oss_triton_kernels_moe.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.gpt_oss_triton_kernels_moe.pack_bitmatrix", "n_typed": 3, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.gpt_oss_triton_kernels_moe.legacy_routing", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.gpt_oss_triton_kernels_moe.triton_kernel_fused_mxfp4_w4a8_experts", "n_typed": 11, "n_any": 0, "n_untyped": 9, "n_overloads": 1, "n_typable": 20, "n_params": 19, "n_function_overloads": 1, "n_function_params": 19 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.gpt_oss_triton_kernels_moe.triton_kernel_moe_forward", "n_typed": 10, "n_any": 0, "n_untyped": 6, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 }, { "kind": "attr", "name": "vllm.model_executor.layers.fused_moe.gpt_oss_triton_kernels_moe.use_legacy_triton_kernels", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.gpt_oss_triton_kernels_moe.OAITritonExperts", "methods": [ { "kind": "function", "name": "OAITritonExperts.activation_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "OAITritonExperts.supports_chunking", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "OAITritonExperts.workspace_shapes", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "OAITritonExperts.apply", "n_typed": 15, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 } ], "properties": [], "attrs": [], "n_typable": 27, "n_typed": 26, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 23, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.gpt_oss_triton_kernels_moe.UnfusedOAITritonExperts", "methods": [ { "kind": "function", "name": "UnfusedOAITritonExperts.activation_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "UnfusedOAITritonExperts.supports_chunking", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "UnfusedOAITritonExperts.workspace_shapes", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "UnfusedOAITritonExperts.moe_sum", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "UnfusedOAITritonExperts.apply", "n_typed": 15, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 } ], "properties": [], "attrs": [], "n_typable": 30, "n_typed": 28, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 25, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.gpt_oss_triton_kernels_moe.BaseOAITritonExperts", "methods": [ { "kind": "function", "name": "BaseOAITritonExperts._supports_current_device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BaseOAITritonExperts._supports_no_act_and_mul", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BaseOAITritonExperts._supports_quant_scheme", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseOAITritonExperts._supports_activation", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseOAITritonExperts._supports_parallel_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseOAITritonExperts.supports_expert_map", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BaseOAITritonExperts.moe_problem_size", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BaseOAITritonExperts.finalize_weight_and_reduce_impl", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BaseOAITritonExperts._make_routing_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 20, "n_typed": 20, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 11, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.gpt_oss_triton_kernels_moe.legacy_routing_from_bitmatrix", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.gpt_oss_triton_kernels_moe.make_routing_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.gpt_oss_triton_kernels_moe.triton_kernel_fused_experts", "n_typed": 13, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 18, "n_params": 17, "n_function_overloads": 1, "n_function_params": 17 }, { "kind": "attr", "name": "vllm.model_executor.layers.fused_moe.gpt_oss_triton_kernels_moe.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.gpt_oss_triton_kernels_moe", "names": [ "vllm.model_executor.layers.fused_moe.gpt_oss_triton_kernels_moe.BaseOAITritonExperts", "vllm.model_executor.layers.fused_moe.gpt_oss_triton_kernels_moe.OAITritonExperts", "vllm.model_executor.layers.fused_moe.gpt_oss_triton_kernels_moe.UnfusedOAITritonExperts", "vllm.model_executor.layers.fused_moe.gpt_oss_triton_kernels_moe.legacy_routing", "vllm.model_executor.layers.fused_moe.gpt_oss_triton_kernels_moe.legacy_routing_from_bitmatrix", "vllm.model_executor.layers.fused_moe.gpt_oss_triton_kernels_moe.logger", "vllm.model_executor.layers.fused_moe.gpt_oss_triton_kernels_moe.make_routing_data", "vllm.model_executor.layers.fused_moe.gpt_oss_triton_kernels_moe.pack_bitmatrix", "vllm.model_executor.layers.fused_moe.gpt_oss_triton_kernels_moe.triton_kernel_fused_experts", "vllm.model_executor.layers.fused_moe.gpt_oss_triton_kernels_moe.triton_kernel_fused_mxfp4_w4a8_experts", "vllm.model_executor.layers.fused_moe.gpt_oss_triton_kernels_moe.triton_kernel_moe_forward", "vllm.model_executor.layers.fused_moe.gpt_oss_triton_kernels_moe.use_legacy_triton_kernels" ], "n_typable": 154, "n_typed": 125, "n_any": 0, "n_untyped": 29, "n_functions": 7, "n_function_overloads": 7, "n_function_params": 69, "n_methods": 18, "n_method_overloads": 18, "n_method_params": 59, "n_classes": 3, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/moe_align_block_size.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.moe_align_block_size.moe_align_block_size", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.moe_align_block_size.batched_moe_align_block_size", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.moe_align_block_size", "names": [ "vllm.model_executor.layers.fused_moe.moe_align_block_size.batched_moe_align_block_size", "vllm.model_executor.layers.fused_moe.moe_align_block_size.moe_align_block_size" ], "n_typable": 11, "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 9, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/moe_permute_unpermute.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.moe_permute_unpermute.moe_permute_unpermute_supported", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.moe_permute_unpermute.moe_permute", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.moe_permute_unpermute.moe_unpermute", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.moe_permute_unpermute", "names": [ "vllm.model_executor.layers.fused_moe.moe_permute_unpermute.moe_permute", "vllm.model_executor.layers.fused_moe.moe_permute_unpermute.moe_permute_unpermute_supported", "vllm.model_executor.layers.fused_moe.moe_permute_unpermute.moe_unpermute" ], "n_typable": 15, "n_typed": 14, "n_any": 0, "n_untyped": 1, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 12, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/mori_prepare_finalize.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.mori_prepare_finalize.MoriPrepareAndFinalize", "methods": [ { "kind": "function", "name": "MoriPrepareAndFinalize.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MoriPrepareAndFinalize.output_is_reduced", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoriPrepareAndFinalize.num_dispatchers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoriPrepareAndFinalize.max_num_tokens_per_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoriPrepareAndFinalize.topk_indices_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoriPrepareAndFinalize.supports_async", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoriPrepareAndFinalize.prepare", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "MoriPrepareAndFinalize.finalize", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [ { "kind": "property", "name": "MoriPrepareAndFinalize.activation_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "MoriPrepareAndFinalize.mori_op", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoriPrepareAndFinalize.num_dispatchers_", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoriPrepareAndFinalize.max_tokens_per_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoriPrepareAndFinalize.use_fp8_dispatch", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 31, "n_typed": 25, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 18, "n_attrs": 4, "n_properties": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.fused_moe.mori_prepare_finalize.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.mori_prepare_finalize", "names": [ "vllm.model_executor.layers.fused_moe.mori_prepare_finalize.MoriPrepareAndFinalize", "vllm.model_executor.layers.fused_moe.mori_prepare_finalize.logger" ], "n_typable": 32, "n_typed": 25, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 18, "n_classes": 1, "n_attrs": 5, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/oracle/fp8.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.oracle.fp8.Fp8MoeBackend", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Fp8MoeBackend.NONE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Fp8MoeBackend.FLASHINFER_TRTLLM", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Fp8MoeBackend.FLASHINFER_CUTLASS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Fp8MoeBackend.DEEPGEMM", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Fp8MoeBackend.BATCHED_DEEPGEMM", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Fp8MoeBackend.MARLIN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Fp8MoeBackend.TRITON", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Fp8MoeBackend.BATCHED_TRITON", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Fp8MoeBackend.AITER", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Fp8MoeBackend.VLLM_CUTLASS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Fp8MoeBackend.BATCHED_VLLM_CUTLASS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Fp8MoeBackend.XPU", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 12, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.oracle.fp8.backend_to_kernel_cls", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.oracle.fp8.map_fp8_backend", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.oracle.fp8.make_fp8_moe_quant_config", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.oracle.fp8.convert_to_fp8_moe_kernel_format", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.oracle.fp8.make_fp8_moe_kernel", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.oracle.fp8.select_fp8_moe_backend", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "attr", "name": "vllm.model_executor.layers.fused_moe.oracle.fp8.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.oracle.fp8", "names": [ "vllm.model_executor.layers.fused_moe.oracle.fp8.Fp8MoeBackend", "vllm.model_executor.layers.fused_moe.oracle.fp8.backend_to_kernel_cls", "vllm.model_executor.layers.fused_moe.oracle.fp8.convert_to_fp8_moe_kernel_format", "vllm.model_executor.layers.fused_moe.oracle.fp8.logger", "vllm.model_executor.layers.fused_moe.oracle.fp8.make_fp8_moe_kernel", "vllm.model_executor.layers.fused_moe.oracle.fp8.make_fp8_moe_quant_config", "vllm.model_executor.layers.fused_moe.oracle.fp8.map_fp8_backend", "vllm.model_executor.layers.fused_moe.oracle.fp8.select_fp8_moe_backend" ], "n_typable": 35, "n_typed": 34, "n_any": 0, "n_untyped": 1, "n_functions": 6, "n_function_overloads": 6, "n_function_params": 28, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 1, "n_attrs": 13, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/oracle/nvfp4.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.oracle.nvfp4.make_nvfp4_moe_kernel", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.oracle.nvfp4.make_mxfp4_moe_quant_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.oracle.nvfp4.backend_to_kernel_cls", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.fused_moe.oracle.nvfp4.FLASHINFER_NVFP4_MOE_BACKENDS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.oracle.nvfp4.NvFp4MoeBackend", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "NvFp4MoeBackend.FLASHINFER_TRTLLM", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NvFp4MoeBackend.FLASHINFER_CUTLASS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NvFp4MoeBackend.FLASHINFER_CUTEDSL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NvFp4MoeBackend.VLLM_CUTLASS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NvFp4MoeBackend.MARLIN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 5, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.oracle.nvfp4.map_nvfp4_backend", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.oracle.nvfp4.is_global_sf_supported_for_nvfp4_backend", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.oracle.nvfp4.make_nvfp4_moe_quant_config", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "attr", "name": "vllm.model_executor.layers.fused_moe.oracle.nvfp4.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.fused_moe.oracle.nvfp4.fi_2_vllm_backend_map", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.oracle.nvfp4.select_nvfp4_moe_backend", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.oracle.nvfp4.convert_to_nvfp4_moe_kernel_format", "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.oracle.nvfp4", "names": [ "vllm.model_executor.layers.fused_moe.oracle.nvfp4.FLASHINFER_NVFP4_MOE_BACKENDS", "vllm.model_executor.layers.fused_moe.oracle.nvfp4.NvFp4MoeBackend", "vllm.model_executor.layers.fused_moe.oracle.nvfp4.backend_to_kernel_cls", "vllm.model_executor.layers.fused_moe.oracle.nvfp4.convert_to_nvfp4_moe_kernel_format", "vllm.model_executor.layers.fused_moe.oracle.nvfp4.fi_2_vllm_backend_map", "vllm.model_executor.layers.fused_moe.oracle.nvfp4.is_global_sf_supported_for_nvfp4_backend", "vllm.model_executor.layers.fused_moe.oracle.nvfp4.logger", "vllm.model_executor.layers.fused_moe.oracle.nvfp4.make_mxfp4_moe_quant_config", "vllm.model_executor.layers.fused_moe.oracle.nvfp4.make_nvfp4_moe_kernel", "vllm.model_executor.layers.fused_moe.oracle.nvfp4.make_nvfp4_moe_quant_config", "vllm.model_executor.layers.fused_moe.oracle.nvfp4.map_nvfp4_backend", "vllm.model_executor.layers.fused_moe.oracle.nvfp4.select_nvfp4_moe_backend" ], "n_typable": 41, "n_typed": 40, "n_any": 0, "n_untyped": 1, "n_functions": 8, "n_function_overloads": 8, "n_function_params": 31, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 1, "n_attrs": 8, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/oracle/unquantized.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.layers.fused_moe.oracle.unquantized.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.oracle.unquantized.convert_to_unquantized_kernel_format", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.oracle.unquantized.map_unquantized_backend", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.oracle.unquantized.UnquantizedMoeBackend", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "UnquantizedMoeBackend.FLASHINFER_TRTLLM", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "UnquantizedMoeBackend.FLASHINFER_CUTLASS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "UnquantizedMoeBackend.AITER", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "UnquantizedMoeBackend.TRITON", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "UnquantizedMoeBackend.CPU", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "UnquantizedMoeBackend.XPU", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "UnquantizedMoeBackend.TPU", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "UnquantizedMoeBackend.OOT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 8, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.oracle.unquantized.select_unquantized_moe_backend", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.model_executor.layers.fused_moe.oracle.unquantized.UNSUPPORTED_BACKEND", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.oracle.unquantized.make_unquantized_moe_kernel", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.oracle.unquantized", "names": [ "vllm.model_executor.layers.fused_moe.oracle.unquantized.UNSUPPORTED_BACKEND", "vllm.model_executor.layers.fused_moe.oracle.unquantized.UnquantizedMoeBackend", "vllm.model_executor.layers.fused_moe.oracle.unquantized.convert_to_unquantized_kernel_format", "vllm.model_executor.layers.fused_moe.oracle.unquantized.logger", "vllm.model_executor.layers.fused_moe.oracle.unquantized.make_unquantized_moe_kernel", "vllm.model_executor.layers.fused_moe.oracle.unquantized.map_unquantized_backend", "vllm.model_executor.layers.fused_moe.oracle.unquantized.select_unquantized_moe_backend" ], "n_typable": 16, "n_typed": 15, "n_any": 0, "n_untyped": 1, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 11, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 1, "n_attrs": 10, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/prepare_finalize/naive_dp_ep.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.prepare_finalize.naive_dp_ep.MoEPrepareAndFinalizeNaiveDPEPMonolithic", "methods": [ { "kind": "function", "name": "MoEPrepareAndFinalizeNaiveDPEPMonolithic.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MoEPrepareAndFinalizeNaiveDPEPMonolithic.max_num_tokens_per_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoEPrepareAndFinalizeNaiveDPEPMonolithic.topk_indices_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoEPrepareAndFinalizeNaiveDPEPMonolithic.num_dispatchers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoEPrepareAndFinalizeNaiveDPEPMonolithic.output_is_reduced", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoEPrepareAndFinalizeNaiveDPEPMonolithic.prepare", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MoEPrepareAndFinalizeNaiveDPEPMonolithic.finalize", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "MoEPrepareAndFinalizeNaiveDPEPMonolithic.activation_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "MoEPrepareAndFinalizeNaiveDPEPMonolithic.is_sequence_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 15, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 7, "n_attrs": 1, "n_properties": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.prepare_finalize.naive_dp_ep.make_moe_prepare_and_finalize_naive_dp_ep", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.prepare_finalize.naive_dp_ep.MoEPrepareAndFinalizeNaiveDPEPModular", "methods": [ { "kind": "function", "name": "MoEPrepareAndFinalizeNaiveDPEPModular.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MoEPrepareAndFinalizeNaiveDPEPModular.max_num_tokens_per_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoEPrepareAndFinalizeNaiveDPEPModular.topk_indices_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoEPrepareAndFinalizeNaiveDPEPModular.num_dispatchers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoEPrepareAndFinalizeNaiveDPEPModular.output_is_reduced", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoEPrepareAndFinalizeNaiveDPEPModular.prepare", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "MoEPrepareAndFinalizeNaiveDPEPModular.finalize", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [ { "kind": "property", "name": "MoEPrepareAndFinalizeNaiveDPEPModular.activation_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "MoEPrepareAndFinalizeNaiveDPEPModular.is_sequence_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 25, "n_typed": 24, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 16, "n_attrs": 1, "n_properties": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.prepare_finalize.naive_dp_ep", "names": [ "vllm.model_executor.layers.fused_moe.prepare_finalize.naive_dp_ep.MoEPrepareAndFinalizeNaiveDPEPModular", "vllm.model_executor.layers.fused_moe.prepare_finalize.naive_dp_ep.MoEPrepareAndFinalizeNaiveDPEPMonolithic", "vllm.model_executor.layers.fused_moe.prepare_finalize.naive_dp_ep.make_moe_prepare_and_finalize_naive_dp_ep" ], "n_typable": 45, "n_typed": 43, "n_any": 0, "n_untyped": 2, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 3, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 23, "n_classes": 2, "n_attrs": 2, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/prepare_finalize/no_dp_ep.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.prepare_finalize.no_dp_ep.make_moe_prepare_and_finalize_no_dp_ep", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.prepare_finalize.no_dp_ep.MoEPrepareAndFinalizeNoDPEPMonolithic", "methods": [ { "kind": "function", "name": "MoEPrepareAndFinalizeNoDPEPMonolithic.max_num_tokens_per_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoEPrepareAndFinalizeNoDPEPMonolithic.topk_indices_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoEPrepareAndFinalizeNoDPEPMonolithic.num_dispatchers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoEPrepareAndFinalizeNoDPEPMonolithic.output_is_reduced", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoEPrepareAndFinalizeNoDPEPMonolithic.prepare", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MoEPrepareAndFinalizeNoDPEPMonolithic.finalize", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "MoEPrepareAndFinalizeNoDPEPMonolithic.activation_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 5, "n_attrs": 0, "n_properties": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.prepare_finalize.no_dp_ep.MoEPrepareAndFinalizeNoDPEPModular", "methods": [ { "kind": "function", "name": "MoEPrepareAndFinalizeNoDPEPModular.max_num_tokens_per_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoEPrepareAndFinalizeNoDPEPModular.topk_indices_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoEPrepareAndFinalizeNoDPEPModular.num_dispatchers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoEPrepareAndFinalizeNoDPEPModular.output_is_reduced", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoEPrepareAndFinalizeNoDPEPModular.prepare", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "MoEPrepareAndFinalizeNoDPEPModular.finalize", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [ { "kind": "property", "name": "MoEPrepareAndFinalizeNoDPEPModular.activation_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [], "n_typable": 21, "n_typed": 21, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 14, "n_attrs": 0, "n_properties": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.prepare_finalize.no_dp_ep", "names": [ "vllm.model_executor.layers.fused_moe.prepare_finalize.no_dp_ep.MoEPrepareAndFinalizeNoDPEPModular", "vllm.model_executor.layers.fused_moe.prepare_finalize.no_dp_ep.MoEPrepareAndFinalizeNoDPEPMonolithic", "vllm.model_executor.layers.fused_moe.prepare_finalize.no_dp_ep.make_moe_prepare_and_finalize_no_dp_ep" ], "n_typable": 35, "n_typed": 35, "n_any": 0, "n_untyped": 0, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 19, "n_classes": 2, "n_attrs": 0, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/routed_experts_capturer.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.layers.fused_moe.routed_experts_capturer.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.routed_experts_capturer.RoutedExpertsReader", "methods": [ { "kind": "function", "name": "RoutedExpertsReader.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RoutedExpertsReader.create", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RoutedExpertsReader.get_instance", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RoutedExpertsReader.attach_buffer", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "RoutedExpertsReader.get_routed_experts", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RoutedExpertsReader.cleanup", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RoutedExpertsReader.__del__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RoutedExpertsReader._instance", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 11, "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 3, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.routed_experts_capturer.RoutedExpertsCapturer", "methods": [ { "kind": "function", "name": "RoutedExpertsCapturer.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RoutedExpertsCapturer.create", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RoutedExpertsCapturer.get_instance", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RoutedExpertsCapturer.init_buffer", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "RoutedExpertsCapturer.capture", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "RoutedExpertsCapturer.clear_buffer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RoutedExpertsCapturer.save_captured_experts", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RoutedExpertsCapturer.cleanup", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RoutedExpertsCapturer.__del__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RoutedExpertsCapturer._instance", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 16, "n_typed": 16, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 6, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.routed_experts_capturer", "names": [ "vllm.model_executor.layers.fused_moe.routed_experts_capturer.RoutedExpertsCapturer", "vllm.model_executor.layers.fused_moe.routed_experts_capturer.RoutedExpertsReader", "vllm.model_executor.layers.fused_moe.routed_experts_capturer.logger" ], "n_typable": 28, "n_typed": 27, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 16, "n_method_overloads": 16, "n_method_params": 9, "n_classes": 2, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/router/base_router.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.router.base_router.eplb_map_to_physical_and_record", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.router.base_router.BaseRouter", "methods": [ { "kind": "function", "name": "BaseRouter.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "BaseRouter.set_capture_fn", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseRouter._validate_eplb_state", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BaseRouter._get_indices_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BaseRouter._apply_eplb_mapping", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseRouter._convert_indices_dtype", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseRouter._compute_routing", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BaseRouter.select_experts", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BaseRouter.top_k", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseRouter.global_num_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseRouter.eplb_state", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseRouter.enable_eplb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseRouter.indices_type_getter", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseRouter.capture_fn", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 28, "n_typed": 22, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 14, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.router.base_router", "names": [ "vllm.model_executor.layers.fused_moe.router.base_router.BaseRouter", "vllm.model_executor.layers.fused_moe.router.base_router.eplb_map_to_physical_and_record" ], "n_typable": 33, "n_typed": 27, "n_any": 0, "n_untyped": 6, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 4, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 14, "n_classes": 1, "n_attrs": 6, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/router/custom_routing_router.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.router.custom_routing_router.CustomRoutingRouter", "methods": [ { "kind": "function", "name": "CustomRoutingRouter.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "CustomRoutingRouter._compute_routing", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [ { "kind": "property", "name": "CustomRoutingRouter.routing_method_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "CustomRoutingRouter.custom_routing_function", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CustomRoutingRouter.renormalize", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 12, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 10, "n_attrs": 2, "n_properties": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.router.custom_routing_router", "names": [ "vllm.model_executor.layers.fused_moe.router.custom_routing_router.CustomRoutingRouter" ], "n_typable": 15, "n_typed": 12, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 10, "n_classes": 1, "n_attrs": 2, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/router/fused_topk_bias_router.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.router.fused_topk_bias_router.vllm_topk_softmax", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.router.fused_topk_bias_router.vllm_topk_sigmoid", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.router.fused_topk_bias_router.FusedTopKBiasRouter", "methods": [ { "kind": "function", "name": "FusedTopKBiasRouter.__init__", "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "FusedTopKBiasRouter._compute_routing", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [ { "kind": "property", "name": "FusedTopKBiasRouter.routing_method_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "FusedTopKBiasRouter.e_score_correction_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedTopKBiasRouter.renormalize", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedTopKBiasRouter.scoring_func", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedTopKBiasRouter.routed_scaling_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 14, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 12, "n_attrs": 4, "n_properties": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.router.fused_topk_bias_router.fused_topk_bias", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.router.fused_topk_bias_router", "names": [ "vllm.model_executor.layers.fused_moe.router.fused_topk_bias_router.FusedTopKBiasRouter", "vllm.model_executor.layers.fused_moe.router.fused_topk_bias_router.fused_topk_bias", "vllm.model_executor.layers.fused_moe.router.fused_topk_bias_router.vllm_topk_sigmoid", "vllm.model_executor.layers.fused_moe.router.fused_topk_bias_router.vllm_topk_softmax" ], "n_typable": 41, "n_typed": 35, "n_any": 0, "n_untyped": 6, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 19, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 12, "n_classes": 1, "n_attrs": 4, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/router/fused_topk_router.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.router.fused_topk_router.vllm_topk_sigmoid", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.router.fused_topk_router.dispatch_topk_softmax_func", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.router.fused_topk_router.fused_topk", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.router.fused_topk_router.FusedTopKRouter", "methods": [ { "kind": "function", "name": "FusedTopKRouter.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "FusedTopKRouter._compute_routing", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [ { "kind": "property", "name": "FusedTopKRouter.routing_method_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "FusedTopKRouter.renormalize", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedTopKRouter.scoring_func", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 12, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 10, "n_attrs": 2, "n_properties": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.router.fused_topk_router.dispatch_topk_sigmoid_func", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.router.fused_topk_router.vllm_topk_softmax", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.router.fused_topk_router", "names": [ "vllm.model_executor.layers.fused_moe.router.fused_topk_router.FusedTopKRouter", "vllm.model_executor.layers.fused_moe.router.fused_topk_router.dispatch_topk_sigmoid_func", "vllm.model_executor.layers.fused_moe.router.fused_topk_router.dispatch_topk_softmax_func", "vllm.model_executor.layers.fused_moe.router.fused_topk_router.fused_topk", "vllm.model_executor.layers.fused_moe.router.fused_topk_router.vllm_topk_sigmoid", "vllm.model_executor.layers.fused_moe.router.fused_topk_router.vllm_topk_softmax" ], "n_typable": 38, "n_typed": 35, "n_any": 0, "n_untyped": 3, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 18, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 10, "n_classes": 1, "n_attrs": 2, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/router/router_factory.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.router.router_factory.create_fused_moe_router", "n_typed": 15, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 15, "n_params": 14, "n_function_overloads": 1, "n_function_params": 14 }, { "kind": "attr", "name": "vllm.model_executor.layers.fused_moe.router.router_factory.EMPTY_EPLB_STATE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.router.router_factory", "names": [ "vllm.model_executor.layers.fused_moe.router.router_factory.EMPTY_EPLB_STATE", "vllm.model_executor.layers.fused_moe.router.router_factory.create_fused_moe_router" ], "n_typable": 16, "n_typed": 16, "n_any": 0, "n_untyped": 0, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 14, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/router/routing_simulator_router.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.router.routing_simulator_router.RoutingSimulator", "methods": [ { "kind": "function", "name": "RoutingSimulator.register_strategy", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "RoutingSimulator.get_available_strategies", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RoutingSimulator.simulate_routing", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RoutingSimulator._routing_strategies", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 11, "n_typed": 10, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.router.routing_simulator_router.RoutingSimulatorRouter", "methods": [ { "kind": "function", "name": "RoutingSimulatorRouter.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "RoutingSimulatorRouter._compute_routing", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [ { "kind": "property", "name": "RoutingSimulatorRouter.routing_method_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [], "n_typable": 11, "n_typed": 10, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 0, "n_properties": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.router.routing_simulator_router.DistributionBasedRouting", "methods": [ { "kind": "function", "name": "DistributionBasedRouting.__init__", "n_typed": 1, "n_any": 1, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DistributionBasedRouting._validate_distribution_params", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DistributionBasedRouting.route_tokens", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "DistributionBasedRouting._sample_expert_ids", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "DistributionBasedRouting._sample_continuous_distribution", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DistributionBasedRouting._normalize_samples", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DistributionBasedRouting._generate_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DistributionBasedRouting.get_distribution_info", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DistributionBasedRouting.distribution", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DistributionBasedRouting.distribution_params", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 28, "n_typed": 23, "n_any": 1, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 18, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.router.routing_simulator_router.RoutingStrategy", "methods": [ { "kind": "function", "name": "RoutingStrategy.route_tokens", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.fused_moe.router.routing_simulator_router.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.router.routing_simulator_router", "names": [ "vllm.model_executor.layers.fused_moe.router.routing_simulator_router.DistributionBasedRouting", "vllm.model_executor.layers.fused_moe.router.routing_simulator_router.RoutingSimulator", "vllm.model_executor.layers.fused_moe.router.routing_simulator_router.RoutingSimulatorRouter", "vllm.model_executor.layers.fused_moe.router.routing_simulator_router.RoutingStrategy", "vllm.model_executor.layers.fused_moe.router.routing_simulator_router.logger" ], "n_typable": 56, "n_typed": 48, "n_any": 1, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 37, "n_classes": 4, "n_attrs": 4, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/runner/default_moe_runner.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.runner.default_moe_runner.get_layer_from_name", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.fused_moe.runner.default_moe_runner.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.runner.default_moe_runner.DefaultMoERunner", "methods": [ { "kind": "function", "name": "DefaultMoERunner.__init__", "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "DefaultMoERunner._maybe_setup_shared_experts_stream", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "DefaultMoERunner.ensure_dp_chunking_init", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DefaultMoERunner.must_reduce_shared_expert_outputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DefaultMoERunner.maybe_all_reduce_tensor_model_parallel", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DefaultMoERunner.apply_routed_input_transform", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DefaultMoERunner._reduce_output", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DefaultMoERunner._encode_layer_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DefaultMoERunner.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DefaultMoERunner.forward_impl_chunked", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "DefaultMoERunner.forward_impl", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [ { "kind": "property", "name": "DefaultMoERunner.use_dp_chunking", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "DefaultMoERunner.moe_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DefaultMoERunner.router", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DefaultMoERunner.routed_input_transform", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DefaultMoERunner.gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DefaultMoERunner.shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DefaultMoERunner.quant_method", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DefaultMoERunner.reduce_results", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DefaultMoERunner.enable_dbo", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DefaultMoERunner.layer_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DefaultMoERunner.batched_hidden_states", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DefaultMoERunner.batched_router_logits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DefaultMoERunner.shared_experts_stream", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DefaultMoERunner.moe_forward", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 53, "n_typed": 39, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 28, "n_attrs": 13, "n_properties": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.runner.default_moe_runner", "names": [ "vllm.model_executor.layers.fused_moe.runner.default_moe_runner.DefaultMoERunner", "vllm.model_executor.layers.fused_moe.runner.default_moe_runner.get_layer_from_name", "vllm.model_executor.layers.fused_moe.runner.default_moe_runner.logger" ], "n_typable": 56, "n_typed": 41, "n_any": 0, "n_untyped": 15, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 28, "n_classes": 1, "n_attrs": 14, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/runner/moe_runner.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.runner.moe_runner.MoERunner", "methods": [ { "kind": "function", "name": "MoERunner.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MoERunner.must_reduce_shared_expert_outputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoERunner.maybe_all_reduce_tensor_model_parallel", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.runner.moe_runner", "names": [ "vllm.model_executor.layers.fused_moe.runner.moe_runner.MoERunner" ], "n_typable": 6, "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/topk_weight_and_reduce.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.topk_weight_and_reduce.TopKWeightAndReduceNaiveBatched", "methods": [ { "kind": "function", "name": "TopKWeightAndReduceNaiveBatched.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TopKWeightAndReduceNaiveBatched.__eq__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TopKWeightAndReduceNaiveBatched.apply", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TopKWeightAndReduceNaiveBatched.rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 7, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.topk_weight_and_reduce.TopKWeightAndReduceNoOP", "methods": [ { "kind": "function", "name": "TopKWeightAndReduceNoOP.__eq__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TopKWeightAndReduceNoOP.apply", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [], "n_typable": 8, "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.topk_weight_and_reduce.TopKWeightAndReduceContiguous", "methods": [ { "kind": "function", "name": "TopKWeightAndReduceContiguous.__eq__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TopKWeightAndReduceContiguous.apply", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [], "n_typable": 8, "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.topk_weight_and_reduce.TopKWeightAndReduceDelegate", "methods": [ { "kind": "function", "name": "TopKWeightAndReduceDelegate.__eq__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TopKWeightAndReduceDelegate.apply", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [], "n_typable": 8, "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.topk_weight_and_reduce", "names": [ "vllm.model_executor.layers.fused_moe.topk_weight_and_reduce.TopKWeightAndReduceContiguous", "vllm.model_executor.layers.fused_moe.topk_weight_and_reduce.TopKWeightAndReduceDelegate", "vllm.model_executor.layers.fused_moe.topk_weight_and_reduce.TopKWeightAndReduceNaiveBatched", "vllm.model_executor.layers.fused_moe.topk_weight_and_reduce.TopKWeightAndReduceNoOP" ], "n_typable": 35, "n_typed": 25, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 25, "n_classes": 4, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/triton_cutlass_moe.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.triton_cutlass_moe.TritonOrCutlassExperts", "methods": [ { "kind": "function", "name": "TritonOrCutlassExperts.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TritonOrCutlassExperts.get_clses", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TritonOrCutlassExperts.workspace_shapes", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "TritonOrCutlassExperts._select_experts_impl", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TritonOrCutlassExperts.is_sm100", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 16, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 13, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.triton_cutlass_moe", "names": [ "vllm.model_executor.layers.fused_moe.triton_cutlass_moe.TritonOrCutlassExperts" ], "n_typable": 18, "n_typed": 16, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 13, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/trtllm_moe.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.fused_moe.trtllm_moe.TrtLlmGenExperts", "methods": [ { "kind": "function", "name": "TrtLlmGenExperts.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "TrtLlmGenExperts.activation_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TrtLlmGenExperts._supports_current_device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TrtLlmGenExperts._supports_no_act_and_mul", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TrtLlmGenExperts._supports_quant_scheme", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TrtLlmGenExperts._supports_activation", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TrtLlmGenExperts._supports_parallel_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TrtLlmGenExperts.supports_chunking", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TrtLlmGenExperts.supports_expert_map", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TrtLlmGenExperts.finalize_weight_and_reduce_impl", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TrtLlmGenExperts.workspace_shapes", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "TrtLlmGenExperts.apply", "n_typed": 15, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TrtLlmGenExperts.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TrtLlmGenExperts.num_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TrtLlmGenExperts.gemm1_alpha", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TrtLlmGenExperts.gemm1_beta", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TrtLlmGenExperts.gemm1_clamp_limit", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TrtLlmGenExperts.max_capture_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 48, "n_typed": 39, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 30, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.trtllm_moe", "names": [ "vllm.model_executor.layers.fused_moe.trtllm_moe.TrtLlmGenExperts" ], "n_typable": 48, "n_typed": 39, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 30, "n_classes": 1, "n_attrs": 6, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/fused_moe/utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.utils.normalize_batched_scales_shape", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.utils.count_expert_num_tokens", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.utils.moe_kernel_quantize_input", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.utils.normalize_scales_shape", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.fused_moe.utils.disable_inplace", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.fused_moe.utils", "names": [ "vllm.model_executor.layers.fused_moe.utils.count_expert_num_tokens", "vllm.model_executor.layers.fused_moe.utils.disable_inplace", "vllm.model_executor.layers.fused_moe.utils.moe_kernel_quantize_input", "vllm.model_executor.layers.fused_moe.utils.normalize_batched_scales_shape", "vllm.model_executor.layers.fused_moe.utils.normalize_scales_shape" ], "n_typable": 18, "n_typed": 18, "n_any": 0, "n_untyped": 0, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 13, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/kda.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.kda.KimiDeltaAttention", "methods": [ { "kind": "function", "name": "KimiDeltaAttention.get_state_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KimiDeltaAttention.get_state_shape", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KimiDeltaAttention.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "KimiDeltaAttention.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "KimiDeltaAttention._forward", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [ { "kind": "property", "name": "KimiDeltaAttention.mamba_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "KimiDeltaAttention.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiDeltaAttention.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiDeltaAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiDeltaAttention.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiDeltaAttention.cache_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiDeltaAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiDeltaAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiDeltaAttention.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiDeltaAttention.prefix", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiDeltaAttention.local_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiDeltaAttention.conv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiDeltaAttention.q_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiDeltaAttention.k_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiDeltaAttention.v_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiDeltaAttention.f_a_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiDeltaAttention.f_b_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiDeltaAttention.dt_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiDeltaAttention.b_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiDeltaAttention.q_conv1d", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiDeltaAttention.k_conv1d", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiDeltaAttention.v_conv1d", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiDeltaAttention.A_log", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiDeltaAttention.g_a_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiDeltaAttention.g_b_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiDeltaAttention.o_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiDeltaAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 49, "n_typed": 22, "n_any": 0, "n_untyped": 27, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 17, "n_attrs": 26, "n_properties": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.kda.kda_attention_fake", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "attr", "name": "vllm.model_executor.layers.kda.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.kda.kda_attention", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "type_ignores": [], "name": "vllm.model_executor.layers.kda", "names": [ "vllm.model_executor.layers.kda.KimiDeltaAttention", "vllm.model_executor.layers.kda.kda_attention", "vllm.model_executor.layers.kda.kda_attention_fake", "vllm.model_executor.layers.kda.logger" ], "n_typable": 66, "n_typed": 38, "n_any": 0, "n_untyped": 28, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 14, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 17, "n_classes": 1, "n_attrs": 27, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/layernorm.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.layernorm.poly_norm", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.model_executor.layers.layernorm.LayerNorm", "methods": [ { "kind": "function", "name": "LayerNorm.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LayerNorm.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LayerNorm.dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LayerNorm.eps", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LayerNorm.weight", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LayerNorm.bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 3, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.layernorm.RMSNormGated", "methods": [ { "kind": "function", "name": "RMSNormGated.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "RMSNormGated.reset_parameters", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RMSNormGated.forward_native", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "RMSNormGated.forward_cuda", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RMSNormGated.eps", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RMSNormGated.activation", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RMSNormGated.weight", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RMSNormGated.group_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RMSNormGated.norm_before_gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 13, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 11, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.layernorm.RMSNorm", "methods": [ { "kind": "function", "name": "RMSNorm.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "RMSNorm.forward_static", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "RMSNorm.forward_native", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "RMSNorm.forward_cuda", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "RMSNorm.forward_hip", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "RMSNorm.forward_xpu", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "RMSNorm.extra_repr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RMSNorm.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RMSNorm.variance_epsilon", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RMSNorm.variance_size_override", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RMSNorm.has_weight", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RMSNorm.weight", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RMSNorm.rocm_norm_func", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RMSNorm.rocm_norm_func_with_add", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 34, "n_typed": 27, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 20, "n_attrs": 7, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.layernorm.rms_norm", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.layernorm.fused_add_rms_norm", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.layers.layernorm.dispatch_rocm_rmsnorm_func", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.model_executor.layers.layernorm.GemmaRMSNorm", "methods": [ { "kind": "function", "name": "GemmaRMSNorm.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GemmaRMSNorm._forward_static_no_residual", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GemmaRMSNorm._forward_static_with_residual", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GemmaRMSNorm.forward_native", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GemmaRMSNorm.forward_cuda", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GemmaRMSNorm.weight", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GemmaRMSNorm.variance_epsilon", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 18, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 13, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.layernorm.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.layernorm", "names": [ "vllm.model_executor.layers.layernorm.GemmaRMSNorm", "vllm.model_executor.layers.layernorm.LayerNorm", "vllm.model_executor.layers.layernorm.RMSNorm", "vllm.model_executor.layers.layernorm.RMSNormGated", "vllm.model_executor.layers.layernorm.dispatch_rocm_rmsnorm_func", "vllm.model_executor.layers.layernorm.fused_add_rms_norm", "vllm.model_executor.layers.layernorm.logger", "vllm.model_executor.layers.layernorm.poly_norm", "vllm.model_executor.layers.layernorm.rms_norm" ], "n_typable": 102, "n_typed": 78, "n_any": 0, "n_untyped": 24, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 14, "n_methods": 18, "n_method_overloads": 18, "n_method_params": 47, "n_classes": 4, "n_attrs": 19, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/lightning_attn.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.lightning_attn.linear_decode_forward_triton", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "vllm.model_executor.layers.lightning_attn.lightning_attention", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "type_ignores": [], "name": "vllm.model_executor.layers.lightning_attn", "names": [ "vllm.model_executor.layers.lightning_attn.lightning_attention", "vllm.model_executor.layers.lightning_attn.linear_decode_forward_triton" ], "n_typable": 15, "n_typed": 15, "n_any": 0, "n_untyped": 0, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 13, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/linear.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.layers.linear.WEIGHT_LOADER_V2_SUPPORTED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.linear.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.linear.LinearMethodBase", "methods": [ { "kind": "function", "name": "LinearMethodBase.create_weights", "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "LinearMethodBase.apply", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 10, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 10, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.linear.adjust_scalar_to_fused_array", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.linear.adjust_block_scale_shard", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.model_executor.layers.linear.QKVParallelLinear", "methods": [ { "kind": "function", "name": "QKVParallelLinear.__init__", "n_typed": 12, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 }, { "kind": "function", "name": "QKVParallelLinear.validate_shard_id", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "QKVParallelLinear._get_shard_offset_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "QKVParallelLinear._get_shard_size_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "QKVParallelLinear._load_fused_module_from_checkpoint", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "QKVParallelLinear.weight_loader_v2", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "QKVParallelLinear.weight_loader", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "QKVParallelLinear.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QKVParallelLinear.head_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QKVParallelLinear.v_head_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QKVParallelLinear.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QKVParallelLinear.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QKVParallelLinear.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QKVParallelLinear.output_sizes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QKVParallelLinear.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QKVParallelLinear.num_kv_head_replicas", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 39, "n_typed": 23, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 23, "n_attrs": 9, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.linear.adjust_marlin_shard", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.model_executor.layers.linear.UnquantizedLinearMethod", "methods": [ { "kind": "function", "name": "UnquantizedLinearMethod.create_weights", "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "UnquantizedLinearMethod.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "UnquantizedLinearMethod.apply", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 14, "n_typed": 12, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 11, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.linear.adjust_bitsandbytes_4bit_shard", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.model_executor.layers.linear.ColumnParallelLinear", "methods": [ { "kind": "function", "name": "ColumnParallelLinear.__init__", "n_typed": 10, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "ColumnParallelLinear._maybe_allow_fp8_block_shape_mismatch", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ColumnParallelLinear.weight_loader", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ColumnParallelLinear.weight_loader_v2", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ColumnParallelLinear.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ColumnParallelLinear.extra_repr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ColumnParallelLinear.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ColumnParallelLinear.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ColumnParallelLinear.input_size_per_partition", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ColumnParallelLinear.output_size_per_partition", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ColumnParallelLinear.output_partition_sizes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ColumnParallelLinear.gather_output", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ColumnParallelLinear.bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 28, "n_typed": 17, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 15, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.linear.LinearBase", "methods": [ { "kind": "function", "name": "LinearBase.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "LinearBase.update_param_tp_status", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LinearBase.input_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LinearBase.output_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LinearBase.skip_bias_add", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LinearBase.params_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LinearBase.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LinearBase.prefix", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LinearBase.allow_fp8_block_shape_mismatch", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LinearBase.return_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LinearBase.disable_tp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LinearBase.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LinearBase.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LinearBase.quant_method", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 22, "n_typed": 9, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 12, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.linear.RowParallelLinear", "methods": [ { "kind": "function", "name": "RowParallelLinear.__init__", "n_typed": 11, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "RowParallelLinear.weight_loader", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "RowParallelLinear.weight_loader_v2", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "RowParallelLinear.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RowParallelLinear.extra_repr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RowParallelLinear.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RowParallelLinear.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RowParallelLinear.input_size_per_partition", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RowParallelLinear.output_size_per_partition", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RowParallelLinear.output_partition_sizes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RowParallelLinear.input_is_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RowParallelLinear.reduce_results", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RowParallelLinear.bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 29, "n_typed": 17, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 16, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.linear.ReplicatedLinear", "methods": [ { "kind": "function", "name": "ReplicatedLinear.__init__", "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "ReplicatedLinear.weight_loader", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ReplicatedLinear.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ReplicatedLinear.extra_repr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ReplicatedLinear.output_partition_sizes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ReplicatedLinear.bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 14, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 12, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.linear.MergedColumnParallelLinear", "methods": [ { "kind": "function", "name": "MergedColumnParallelLinear.__init__", "n_typed": 10, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "MergedColumnParallelLinear.validate_shard_id", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MergedColumnParallelLinear.weight_loader", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MergedColumnParallelLinear._load_fused_module_from_checkpoint", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MergedColumnParallelLinear.weight_loader_v2", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MergedColumnParallelLinear.output_sizes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MergedColumnParallelLinear.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MergedColumnParallelLinear.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 28, "n_typed": 20, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 20, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.linear", "names": [ "vllm.model_executor.layers.linear.ColumnParallelLinear", "vllm.model_executor.layers.linear.LinearBase", "vllm.model_executor.layers.linear.LinearMethodBase", "vllm.model_executor.layers.linear.MergedColumnParallelLinear", "vllm.model_executor.layers.linear.QKVParallelLinear", "vllm.model_executor.layers.linear.ReplicatedLinear", "vllm.model_executor.layers.linear.RowParallelLinear", "vllm.model_executor.layers.linear.UnquantizedLinearMethod", "vllm.model_executor.layers.linear.WEIGHT_LOADER_V2_SUPPORTED", "vllm.model_executor.layers.linear.adjust_bitsandbytes_4bit_shard", "vllm.model_executor.layers.linear.adjust_block_scale_shard", "vllm.model_executor.layers.linear.adjust_marlin_shard", "vllm.model_executor.layers.linear.adjust_scalar_to_fused_array", "vllm.model_executor.layers.linear.logger" ], "n_typable": 207, "n_typed": 138, "n_any": 0, "n_untyped": 69, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 12, "n_methods": 34, "n_method_overloads": 34, "n_method_params": 115, "n_classes": 8, "n_attrs": 43, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/logits_processor.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.logits_processor.LogitsProcessor", "methods": [ { "kind": "function", "name": "LogitsProcessor.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "LogitsProcessor.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LogitsProcessor._gather_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LogitsProcessor._get_logits", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LogitsProcessor.get_top_tokens", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LogitsProcessor.extra_repr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LogitsProcessor.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LogitsProcessor.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LogitsProcessor.logits_as_input", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LogitsProcessor.org_vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LogitsProcessor.soft_cap", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LogitsProcessor.use_all_gather", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 27, "n_typed": 21, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 15, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.logits_processor", "names": [ "vllm.model_executor.layers.logits_processor.LogitsProcessor" ], "n_typable": 27, "n_typed": 21, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 15, "n_classes": 1, "n_attrs": 6, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/mamba/abstract.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.mamba.abstract.MambaBase", "methods": [ { "kind": "function", "name": "MambaBase.get_state_shape", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MambaBase.get_state_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MambaBase.get_kv_cache_spec", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MambaBase.get_attn_backend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "MambaBase.mamba_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "MambaBase.kv_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 1, "n_attrs": 1, "n_properties": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.mamba.abstract", "names": [ "vllm.model_executor.layers.mamba.abstract.MambaBase" ], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 1, "n_classes": 1, "n_attrs": 1, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/mamba/linear_attn.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.mamba.linear_attn.linear_attention_fake", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.layers.mamba.linear_attn.linear_attention", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.model_executor.layers.mamba.linear_attn.MiniMaxText01LinearAttention", "methods": [ { "kind": "function", "name": "MiniMaxText01LinearAttention.get_state_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MiniMaxText01LinearAttention.get_state_shape", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MiniMaxText01LinearAttention.__init__", "n_typed": 14, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 }, { "kind": "function", "name": "MiniMaxText01LinearAttention.weight_direct_load", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniMaxText01LinearAttention._build_slope_tensor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniMaxText01LinearAttention._prefill_and_mix_infer", "n_typed": 0, "n_any": 0, "n_untyped": 7, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "MiniMaxText01LinearAttention._decode_infer", "n_typed": 0, "n_any": 0, "n_untyped": 7, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "MiniMaxText01LinearAttention.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MiniMaxText01LinearAttention._forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [ { "kind": "property", "name": "MiniMaxText01LinearAttention.mamba_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "MiniMaxText01LinearAttention.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01LinearAttention.BLOCK", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01LinearAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01LinearAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01LinearAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01LinearAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01LinearAttention.hidden_inner_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01LinearAttention.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01LinearAttention.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01LinearAttention.tp_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01LinearAttention.qkv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01LinearAttention.tp_hidden", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01LinearAttention.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01LinearAttention.cache_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01LinearAttention.prefix", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01LinearAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01LinearAttention.output_gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01LinearAttention.out_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01LinearAttention.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01LinearAttention.tp_slope", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01LinearAttention.slope_rate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 65, "n_typed": 29, "n_any": 0, "n_untyped": 36, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 34, "n_attrs": 21, "n_properties": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.mamba.linear_attn.MiniMaxText01LinearKernel", "methods": [ { "kind": "function", "name": "MiniMaxText01LinearKernel.jit_linear_forward_prefix", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 8, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.mamba.linear_attn.clear_linear_attention_cache_for_new_sequences", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.mamba.linear_attn.linear_attention_prefill_and_mix", "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "vllm.model_executor.layers.mamba.linear_attn.linear_attention_decode", "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "class", "name": "vllm.model_executor.layers.mamba.linear_attn.MiniMaxText01RMSNormTP", "methods": [ { "kind": "function", "name": "MiniMaxText01RMSNormTP.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniMaxText01RMSNormTP.weight_loader", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniMaxText01RMSNormTP._forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniMaxText01RMSNormTP.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniMaxText01RMSNormTP.forward_qk", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniMaxText01RMSNormTP.name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MiniMaxText01RMSNormTP.tp_world", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01RMSNormTP.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01RMSNormTP.weight", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01RMSNormTP.variance_epsilon", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 16, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 11, "n_attrs": 5, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.mamba.linear_attn", "names": [ "vllm.model_executor.layers.mamba.linear_attn.MiniMaxText01LinearAttention", "vllm.model_executor.layers.mamba.linear_attn.MiniMaxText01LinearKernel", "vllm.model_executor.layers.mamba.linear_attn.MiniMaxText01RMSNormTP", "vllm.model_executor.layers.mamba.linear_attn.clear_linear_attention_cache_for_new_sequences", "vllm.model_executor.layers.mamba.linear_attn.linear_attention", "vllm.model_executor.layers.mamba.linear_attn.linear_attention_decode", "vllm.model_executor.layers.mamba.linear_attn.linear_attention_fake", "vllm.model_executor.layers.mamba.linear_attn.linear_attention_prefill_and_mix" ], "n_typable": 132, "n_typed": 91, "n_any": 0, "n_untyped": 41, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 33, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 53, "n_classes": 3, "n_attrs": 26, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/mamba/mamba_mixer.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.mamba.mamba_mixer.split_batch_to_prefill_and_decode", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.model_executor.layers.mamba.mamba_mixer.PrefillDecodeSplit", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "PrefillDecodeSplit.hidden_states_BC_p", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PrefillDecodeSplit.hidden_states_BC_d", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PrefillDecodeSplit.gate_p", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PrefillDecodeSplit.gate_d", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.mamba.mamba_mixer.MambaMixer", "methods": [ { "kind": "function", "name": "MambaMixer.__init__", "n_typed": 14, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 }, { "kind": "function", "name": "MambaMixer._ssm_transform", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MambaMixer.forward", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MambaMixer.forward_impl", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MambaMixer.get_state_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MambaMixer.get_state_shape", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MambaMixer._time_proj_bias", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "MambaMixer.mamba_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "MambaMixer.time_step_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer.ssm_state_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer.use_rms_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer.activation", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer.is_lora_enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer.conv_kernel_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer.conv1d", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer.in_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer.x_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer.dt_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer.A", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer.D", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer.out_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer.dt_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer.b_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer.c_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer.kv_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer.cache_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer.prefix", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 49, "n_typed": 24, "n_any": 0, "n_untyped": 25, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 20, "n_attrs": 21, "n_properties": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.mamba.mamba_mixer.mamba_mixer_fake", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.mamba.mamba_mixer.mamba_mixer", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [], "name": "vllm.model_executor.layers.mamba.mamba_mixer", "names": [ "vllm.model_executor.layers.mamba.mamba_mixer.MambaMixer", "vllm.model_executor.layers.mamba.mamba_mixer.PrefillDecodeSplit", "vllm.model_executor.layers.mamba.mamba_mixer.mamba_mixer", "vllm.model_executor.layers.mamba.mamba_mixer.mamba_mixer_fake", "vllm.model_executor.layers.mamba.mamba_mixer.split_batch_to_prefill_and_decode" ], "n_typable": 62, "n_typed": 37, "n_any": 0, "n_untyped": 25, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 10, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 20, "n_classes": 2, "n_attrs": 25, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/mamba/mamba_mixer2.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.mamba.mamba_mixer2.MambaMixer2", "methods": [ { "kind": "function", "name": "MambaMixer2.__init__", "n_typed": 16, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 17, "n_params": 16, "n_function_overloads": 1, "n_function_params": 16 }, { "kind": "function", "name": "MambaMixer2.forward", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MambaMixer2.conv_ssm_forward", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MambaMixer2.get_state_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MambaMixer2.get_state_shape", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "MambaMixer2.mamba_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "MambaMixer2.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer2.ssm_state_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer2.conv_kernel_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer2.activation", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer2.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer2.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer2.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer2.n_groups", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer2.groups_ssm_state_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer2.conv_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer2.A", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer2.D", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer2.dt_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer2.use_rms_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer2.out_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer2.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer2.split_hidden_states_B_C_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer2.kv_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer2.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer2.cache_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer2.prefix", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer2.num_spec", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer2.tped_intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer2.tped_conv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer2.tped_dt_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer2.is_blackwell", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer2.conv1d", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaMixer2.in_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 54, "n_typed": 23, "n_any": 0, "n_untyped": 31, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 20, "n_attrs": 28, "n_properties": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.mamba.mamba_mixer2.mamba_mixer2", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.mamba.mamba_mixer2.mamba_mixer2_fake", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.mamba.mamba_mixer2.mamba_v2_sharded_weight_loader", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.model_executor.layers.mamba.mamba_mixer2.Mixer2RMSNormGated", "methods": [ { "kind": "function", "name": "Mixer2RMSNormGated.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Mixer2RMSNormGated.forward_native", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Mixer2RMSNormGated.forward_cuda", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Mixer2RMSNormGated.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Mixer2RMSNormGated.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Mixer2RMSNormGated.full_hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Mixer2RMSNormGated.group_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Mixer2RMSNormGated.per_rank_hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Mixer2RMSNormGated.n_groups", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Mixer2RMSNormGated.variance_epsilon", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Mixer2RMSNormGated.use_rms_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Mixer2RMSNormGated.weight", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 9, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 8, "n_attrs": 9, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.mamba.mamba_mixer2", "names": [ "vllm.model_executor.layers.mamba.mamba_mixer2.MambaMixer2", "vllm.model_executor.layers.mamba.mamba_mixer2.Mixer2RMSNormGated", "vllm.model_executor.layers.mamba.mamba_mixer2.mamba_mixer2", "vllm.model_executor.layers.mamba.mamba_mixer2.mamba_mixer2_fake", "vllm.model_executor.layers.mamba.mamba_mixer2.mamba_v2_sharded_weight_loader" ], "n_typable": 86, "n_typed": 44, "n_any": 0, "n_untyped": 42, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 9, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 28, "n_classes": 2, "n_attrs": 37, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/mamba/mamba_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.mamba.mamba_utils.get_temporal_copy_spec", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "attr", "name": "vllm.model_executor.layers.mamba.mamba_utils.MambaStateCopyFunc", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.mamba.mamba_utils.MambaCopySpec", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "MambaCopySpec.start_addr", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MambaCopySpec.num_elements", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.mamba.mamba_utils.get_conv_copy_spec", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.model_executor.layers.mamba.mamba_utils.MambaStateDtypeCalculator", "methods": [ { "kind": "function", "name": "MambaStateDtypeCalculator.linear_attention_state_dtype", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MambaStateDtypeCalculator.mamba1_state_dtype", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MambaStateDtypeCalculator.mamba2_state_dtype", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MambaStateDtypeCalculator._mamba_state_dtype", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MambaStateDtypeCalculator.short_conv_state_dtype", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MambaStateDtypeCalculator.gated_delta_net_state_dtype", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MambaStateDtypeCalculator.kda_state_dtype", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 25, "n_typed": 24, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 18, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.mamba.mamba_utils.MambaStateShapeCalculator", "methods": [ { "kind": "function", "name": "MambaStateShapeCalculator.linear_attention_state_shape", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MambaStateShapeCalculator.mamba1_state_shape", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MambaStateShapeCalculator.mamba2_state_shape", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "MambaStateShapeCalculator.short_conv_state_shape", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MambaStateShapeCalculator.extra_groups_for_head_shards", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MambaStateShapeCalculator.gated_delta_net_state_shape", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "MambaStateShapeCalculator.kda_state_shape", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [], "n_typable": 41, "n_typed": 39, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 34, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.mamba.mamba_utils.MambaStateCopyFuncCalculator", "methods": [ { "kind": "function", "name": "MambaStateCopyFuncCalculator.linear_attention_state_copy_func", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MambaStateCopyFuncCalculator.mamba1_state_copy_func", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MambaStateCopyFuncCalculator.mamba2_state_copy_func", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MambaStateCopyFuncCalculator.short_conv_state_copy_func", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MambaStateCopyFuncCalculator.gated_delta_net_state_copy_func", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MambaStateCopyFuncCalculator.kda_state_copy_func", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 0, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.mamba.mamba_utils", "names": [ "vllm.model_executor.layers.mamba.mamba_utils.MambaCopySpec", "vllm.model_executor.layers.mamba.mamba_utils.MambaStateCopyFunc", "vllm.model_executor.layers.mamba.mamba_utils.MambaStateCopyFuncCalculator", "vllm.model_executor.layers.mamba.mamba_utils.MambaStateDtypeCalculator", "vllm.model_executor.layers.mamba.mamba_utils.MambaStateShapeCalculator", "vllm.model_executor.layers.mamba.mamba_utils.get_conv_copy_spec", "vllm.model_executor.layers.mamba.mamba_utils.get_temporal_copy_spec" ], "n_typable": 83, "n_typed": 74, "n_any": 0, "n_untyped": 9, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 8, "n_methods": 20, "n_method_overloads": 20, "n_method_params": 52, "n_classes": 4, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/mamba/ops/causal_conv1d.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.mamba.ops.causal_conv1d.causal_conv1d_fn", "n_typed": 13, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 17, "n_params": 16, "n_function_overloads": 1, "n_function_params": 16 }, { "kind": "function", "name": "vllm.model_executor.layers.mamba.ops.causal_conv1d.causal_conv1d_update", "n_typed": 12, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 } ], "type_ignores": [], "name": "vllm.model_executor.layers.mamba.ops.causal_conv1d", "names": [ "vllm.model_executor.layers.mamba.ops.causal_conv1d.causal_conv1d_fn", "vllm.model_executor.layers.mamba.ops.causal_conv1d.causal_conv1d_update" ], "n_typable": 31, "n_typed": 25, "n_any": 0, "n_untyped": 6, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 29, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/mamba/ops/layernorm_gated.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.mamba.ops.layernorm_gated.rms_norm_gated", "n_typed": 0, "n_any": 0, "n_untyped": 8, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "type_ignores": [], "name": "vllm.model_executor.layers.mamba.ops.layernorm_gated", "names": [ "vllm.model_executor.layers.mamba.ops.layernorm_gated.rms_norm_gated" ], "n_typable": 8, "n_typed": 0, "n_any": 0, "n_untyped": 8, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 7, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/mamba/ops/mamba_ssm.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.layers.mamba.ops.mamba_ssm.TRITON3", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.mamba.ops.mamba_ssm.selective_state_update", "n_typed": 0, "n_any": 0, "n_untyped": 18, "n_overloads": 1, "n_typable": 18, "n_params": 17, "n_function_overloads": 1, "n_function_params": 17 }, { "kind": "function", "name": "vllm.model_executor.layers.mamba.ops.mamba_ssm.selective_scan_fn", "n_typed": 1, "n_any": 0, "n_untyped": 20, "n_overloads": 1, "n_typable": 21, "n_params": 20, "n_function_overloads": 1, "n_function_params": 20 }, { "kind": "function", "name": "vllm.model_executor.layers.mamba.ops.mamba_ssm.softplus", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.mamba.ops.mamba_ssm", "names": [ "vllm.model_executor.layers.mamba.ops.mamba_ssm.TRITON3", "vllm.model_executor.layers.mamba.ops.mamba_ssm.selective_scan_fn", "vllm.model_executor.layers.mamba.ops.mamba_ssm.selective_state_update", "vllm.model_executor.layers.mamba.ops.mamba_ssm.softplus" ], "n_typable": 42, "n_typed": 1, "n_any": 0, "n_untyped": 41, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 38, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/mamba/ops/ssd_chunk_scan.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.layers.mamba.ops.ssd_chunk_scan.TRITON_22", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.mamba.ops.ssd_chunk_scan", "names": [ "vllm.model_executor.layers.mamba.ops.ssd_chunk_scan.TRITON_22" ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/mamba/ops/ssd_chunk_state.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.mamba.ops.ssd_chunk_state.chunk_state_varlen", "n_typed": 0, "n_any": 0, "n_untyped": 8, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "type_ignores": [], "name": "vllm.model_executor.layers.mamba.ops.ssd_chunk_state", "names": [ "vllm.model_executor.layers.mamba.ops.ssd_chunk_state.chunk_state_varlen" ], "n_typable": 8, "n_typed": 0, "n_any": 0, "n_untyped": 8, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 7, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/mamba/ops/ssd_combined.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.layers.mamba.ops.ssd_combined.TRITON_22", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.mamba.ops.ssd_combined.is_int_pow_2", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.mamba.ops.ssd_combined.mamba_chunk_scan_combined_varlen", "n_typed": 0, "n_any": 0, "n_untyped": 20, "n_overloads": 1, "n_typable": 20, "n_params": 19, "n_function_overloads": 1, "n_function_params": 19 } ], "type_ignores": [], "name": "vllm.model_executor.layers.mamba.ops.ssd_combined", "names": [ "vllm.model_executor.layers.mamba.ops.ssd_combined.TRITON_22", "vllm.model_executor.layers.mamba.ops.ssd_combined.is_int_pow_2", "vllm.model_executor.layers.mamba.ops.ssd_combined.mamba_chunk_scan_combined_varlen" ], "n_typable": 23, "n_typed": 0, "n_any": 0, "n_untyped": 23, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 20, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/mamba/short_conv.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.mamba.short_conv.ShortConv", "methods": [ { "kind": "function", "name": "ShortConv.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "ShortConv.forward_native", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ShortConv.forward", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ShortConv.forward_cuda", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ShortConv.get_state_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ShortConv.get_state_shape", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "ShortConv.mamba_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "ShortConv.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ShortConv.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ShortConv.conv_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ShortConv.L_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ShortConv.bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ShortConv.conv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ShortConv.in_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ShortConv.out_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ShortConv.kv_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ShortConv.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ShortConv.cache_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ShortConv.prefix", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 31, "n_typed": 14, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 12, "n_attrs": 12, "n_properties": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.mamba.short_conv.short_conv", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.mamba.short_conv.short_conv_fake", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [], "name": "vllm.model_executor.layers.mamba.short_conv", "names": [ "vllm.model_executor.layers.mamba.short_conv.ShortConv", "vllm.model_executor.layers.mamba.short_conv.short_conv", "vllm.model_executor.layers.mamba.short_conv.short_conv_fake" ], "n_typable": 39, "n_typed": 22, "n_any": 0, "n_untyped": 17, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 6, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 12, "n_classes": 1, "n_attrs": 12, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/mla.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.mla.MLAModules", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "MLAModules.kv_a_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MLAModules.kv_b_proj", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MLAModules.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MLAModules.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MLAModules.fused_qkv_a_proj", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MLAModules.kv_a_proj_with_mqa", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MLAModules.q_a_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MLAModules.q_b_proj", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MLAModules.q_proj", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MLAModules.indexer", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MLAModules.is_sparse", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MLAModules.topk_indices_buffer", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MLAModules.indexer_rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 13, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.mla.MultiHeadLatentAttentionWrapper", "methods": [ { "kind": "function", "name": "MultiHeadLatentAttentionWrapper.__init__", "n_typed": 13, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 }, { "kind": "function", "name": "MultiHeadLatentAttentionWrapper.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MultiHeadLatentAttentionWrapper.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadLatentAttentionWrapper.qk_nope_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadLatentAttentionWrapper.qk_rope_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadLatentAttentionWrapper.qk_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadLatentAttentionWrapper.v_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadLatentAttentionWrapper.q_lora_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadLatentAttentionWrapper.kv_lora_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadLatentAttentionWrapper.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadLatentAttentionWrapper.fused_qkv_a_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadLatentAttentionWrapper.kv_a_proj_with_mqa", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadLatentAttentionWrapper.q_a_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadLatentAttentionWrapper.q_b_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadLatentAttentionWrapper.q_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadLatentAttentionWrapper.kv_a_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadLatentAttentionWrapper.kv_b_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadLatentAttentionWrapper.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadLatentAttentionWrapper.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadLatentAttentionWrapper.indexer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadLatentAttentionWrapper.indexer_rope_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadLatentAttentionWrapper.is_sparse", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadLatentAttentionWrapper.mla_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadLatentAttentionWrapper.prefix", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadLatentAttentionWrapper.topk_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadLatentAttentionWrapper.topk_indices_buffer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 41, "n_typed": 17, "n_any": 0, "n_untyped": 24, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 15, "n_attrs": 24, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.mla", "names": [ "vllm.model_executor.layers.mla.MLAModules", "vllm.model_executor.layers.mla.MultiHeadLatentAttentionWrapper" ], "n_typable": 41, "n_typed": 17, "n_any": 0, "n_untyped": 24, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 15, "n_classes": 2, "n_attrs": 37, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/pooler/abstract.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.pooler.abstract.Pooler", "methods": [ { "kind": "function", "name": "Pooler.get_supported_tasks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Pooler.get_pooling_updates", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Pooler.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.pooler.abstract", "names": [ "vllm.model_executor.layers.pooler.abstract.Pooler" ], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/pooler/activations.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.pooler.activations.resolve_classifier_act_fn", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.model_executor.layers.pooler.activations.PoolerMultiLabelClassify", "methods": [ { "kind": "function", "name": "PoolerMultiLabelClassify.forward_chunk", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.pooler.activations.PoolerNormalize", "methods": [ { "kind": "function", "name": "PoolerNormalize.forward_chunk", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.pooler.activations.LambdaPoolerActivation", "methods": [ { "kind": "function", "name": "LambdaPoolerActivation.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LambdaPoolerActivation.forward_chunk", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LambdaPoolerActivation.fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 5, "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.pooler.activations.PoolerIdentity", "methods": [ { "kind": "function", "name": "PoolerIdentity.forward_chunk", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.pooler.activations.get_classification_act_fn", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.pooler.activations.PoolerClassify", "methods": [ { "kind": "function", "name": "PoolerClassify.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PoolerClassify.forward_chunk", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PoolerClassify.num_labels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 5, "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.pooler.activations.PoolerActivation", "methods": [ { "kind": "function", "name": "PoolerActivation.wraps", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PoolerActivation.forward_chunk", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PoolerActivation.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.pooler.activations.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.pooler.activations.get_cross_encoder_act_fn", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.pooler.activations", "names": [ "vllm.model_executor.layers.pooler.activations.LambdaPoolerActivation", "vllm.model_executor.layers.pooler.activations.PoolerActivation", "vllm.model_executor.layers.pooler.activations.PoolerClassify", "vllm.model_executor.layers.pooler.activations.PoolerIdentity", "vllm.model_executor.layers.pooler.activations.PoolerMultiLabelClassify", "vllm.model_executor.layers.pooler.activations.PoolerNormalize", "vllm.model_executor.layers.pooler.activations.get_classification_act_fn", "vllm.model_executor.layers.pooler.activations.get_cross_encoder_act_fn", "vllm.model_executor.layers.pooler.activations.logger", "vllm.model_executor.layers.pooler.activations.resolve_classifier_act_fn" ], "n_typable": 31, "n_typed": 25, "n_any": 0, "n_untyped": 6, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 5, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 10, "n_classes": 6, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/pooler/common.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.layers.pooler.common.ClassifierFn", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.pooler.common.ProjectorFn", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.pooler.common.PoolingParamsUpdate", "methods": [ { "kind": "function", "name": "PoolingParamsUpdate.__or__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PoolingParamsUpdate.apply", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PoolingParamsUpdate.requires_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.pooler.common.ActivationFn", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.pooler.common", "names": [ "vllm.model_executor.layers.pooler.common.ActivationFn", "vllm.model_executor.layers.pooler.common.ClassifierFn", "vllm.model_executor.layers.pooler.common.PoolingParamsUpdate", "vllm.model_executor.layers.pooler.common.ProjectorFn" ], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_classes": 1, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/pooler/seqwise/heads.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.layers.pooler.seqwise.heads.SequencePoolerHeadOutput", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.pooler.seqwise.heads.SequencePoolerHead", "methods": [ { "kind": "function", "name": "SequencePoolerHead.get_supported_tasks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SequencePoolerHead.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.pooler.seqwise.heads.EmbeddingPoolerHead", "methods": [ { "kind": "function", "name": "EmbeddingPoolerHead.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "EmbeddingPoolerHead.get_supported_tasks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EmbeddingPoolerHead.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EmbeddingPoolerHead.projector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EmbeddingPoolerHead.head_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EmbeddingPoolerHead.activation", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 8, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 5, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.pooler.seqwise.heads.ClassifierPoolerHead", "methods": [ { "kind": "function", "name": "ClassifierPoolerHead.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ClassifierPoolerHead.get_supported_tasks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ClassifierPoolerHead.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ClassifierPoolerHead.classifier", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ClassifierPoolerHead.logit_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ClassifierPoolerHead.head_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ClassifierPoolerHead.activation", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 9, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_attrs": 4, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.pooler.seqwise.heads", "names": [ "vllm.model_executor.layers.pooler.seqwise.heads.ClassifierPoolerHead", "vllm.model_executor.layers.pooler.seqwise.heads.EmbeddingPoolerHead", "vllm.model_executor.layers.pooler.seqwise.heads.SequencePoolerHead", "vllm.model_executor.layers.pooler.seqwise.heads.SequencePoolerHeadOutput" ], "n_typable": 29, "n_typed": 22, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 13, "n_classes": 3, "n_attrs": 8, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/pooler/seqwise/poolers.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.pooler.seqwise.poolers.pooler_for_embed", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.pooler.seqwise.poolers.SequencePoolingFn", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.pooler.seqwise.poolers.SequencePoolingHeadFn", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.pooler.seqwise.poolers.pooler_for_classify", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.model_executor.layers.pooler.seqwise.poolers.SequencePooler", "methods": [ { "kind": "function", "name": "SequencePooler.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SequencePooler.get_supported_tasks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SequencePooler.get_pooling_updates", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SequencePooler.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SequencePooler.pooling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SequencePooler.head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 9, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 5, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.pooler.seqwise.poolers.SequencePoolerOutput", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.pooler.seqwise.poolers", "names": [ "vllm.model_executor.layers.pooler.seqwise.poolers.SequencePooler", "vllm.model_executor.layers.pooler.seqwise.poolers.SequencePoolerOutput", "vllm.model_executor.layers.pooler.seqwise.poolers.SequencePoolingFn", "vllm.model_executor.layers.pooler.seqwise.poolers.SequencePoolingHeadFn", "vllm.model_executor.layers.pooler.seqwise.poolers.pooler_for_classify", "vllm.model_executor.layers.pooler.seqwise.poolers.pooler_for_embed" ], "n_typable": 21, "n_typed": 17, "n_any": 0, "n_untyped": 4, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 5, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 5, "n_classes": 1, "n_attrs": 5, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/pooler/seqwise/methods.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.pooler.seqwise.methods.LastPool", "methods": [ { "kind": "function", "name": "LastPool.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.pooler.seqwise.methods.CLSPool", "methods": [ { "kind": "function", "name": "CLSPool.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.pooler.seqwise.methods.MeanPool", "methods": [ { "kind": "function", "name": "MeanPool.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.pooler.seqwise.methods.SequencePoolingMethod", "methods": [ { "kind": "function", "name": "SequencePoolingMethod.get_supported_tasks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SequencePoolingMethod.get_pooling_updates", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SequencePoolingMethod.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.pooler.seqwise.methods.SequencePoolingMethodOutput", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.pooler.seqwise.methods.get_seq_pooling_method", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.pooler.seqwise.methods", "names": [ "vllm.model_executor.layers.pooler.seqwise.methods.CLSPool", "vllm.model_executor.layers.pooler.seqwise.methods.LastPool", "vllm.model_executor.layers.pooler.seqwise.methods.MeanPool", "vllm.model_executor.layers.pooler.seqwise.methods.SequencePoolingMethod", "vllm.model_executor.layers.pooler.seqwise.methods.SequencePoolingMethodOutput", "vllm.model_executor.layers.pooler.seqwise.methods.get_seq_pooling_method" ], "n_typable": 18, "n_typed": 17, "n_any": 0, "n_untyped": 1, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 9, "n_classes": 4, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/pooler/special.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.pooler.special.IdentityPooler", "methods": [ { "kind": "function", "name": "IdentityPooler.get_supported_tasks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "IdentityPooler.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.pooler.special.BOSEOSFilter", "methods": [ { "kind": "function", "name": "BOSEOSFilter.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BOSEOSFilter.get_supported_tasks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BOSEOSFilter.get_pooling_updates", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BOSEOSFilter.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BOSEOSFilter.pooler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BOSEOSFilter.bos_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BOSEOSFilter.eos_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 10, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 6, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.pooler.special.DispatchPooler", "methods": [ { "kind": "function", "name": "DispatchPooler.for_embedding", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DispatchPooler.for_seq_cls", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DispatchPooler.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DispatchPooler.get_supported_tasks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DispatchPooler.get_pooling_updates", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DispatchPooler.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DispatchPooler.extra_repr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DispatchPooler.poolers_by_task", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 13, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 8, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.pooler.special", "names": [ "vllm.model_executor.layers.pooler.special.BOSEOSFilter", "vllm.model_executor.layers.pooler.special.DispatchPooler", "vllm.model_executor.layers.pooler.special.IdentityPooler" ], "n_typable": 33, "n_typed": 27, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 16, "n_classes": 3, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/pooler/tokwise/heads.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.pooler.tokwise.heads.TokenEmbeddingPoolerHead", "methods": [ { "kind": "function", "name": "TokenEmbeddingPoolerHead.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "TokenEmbeddingPoolerHead.get_supported_tasks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TokenEmbeddingPoolerHead.forward_chunk", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TokenEmbeddingPoolerHead.head_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TokenEmbeddingPoolerHead.projector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TokenEmbeddingPoolerHead.activation", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 8, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 5, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.pooler.tokwise.heads.TokenPoolerHeadOutputItem", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.pooler.tokwise.heads.TokenClassifierPoolerHead", "methods": [ { "kind": "function", "name": "TokenClassifierPoolerHead.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "TokenClassifierPoolerHead.get_supported_tasks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TokenClassifierPoolerHead.forward_chunk", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TokenClassifierPoolerHead.classifier", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TokenClassifierPoolerHead.logit_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TokenClassifierPoolerHead.head_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TokenClassifierPoolerHead.activation", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 9, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.pooler.tokwise.heads.TokenPoolerHead", "methods": [ { "kind": "function", "name": "TokenPoolerHead.get_supported_tasks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TokenPoolerHead.forward_chunk", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TokenPoolerHead.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.pooler.tokwise.heads", "names": [ "vllm.model_executor.layers.pooler.tokwise.heads.TokenClassifierPoolerHead", "vllm.model_executor.layers.pooler.tokwise.heads.TokenEmbeddingPoolerHead", "vllm.model_executor.layers.pooler.tokwise.heads.TokenPoolerHead", "vllm.model_executor.layers.pooler.tokwise.heads.TokenPoolerHeadOutputItem" ], "n_typable": 32, "n_typed": 25, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 15, "n_classes": 3, "n_attrs": 8, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/pooler/tokwise/methods.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.layers.pooler.tokwise.methods.TokenPoolingMethodOutputItem", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.pooler.tokwise.methods.AllPool", "methods": [ { "kind": "function", "name": "AllPool.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AllPool.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AllPool.enable_chunked_prefill", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 5, "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.pooler.tokwise.methods.TokenPoolingMethod", "methods": [ { "kind": "function", "name": "TokenPoolingMethod.get_supported_tasks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TokenPoolingMethod.get_pooling_updates", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TokenPoolingMethod.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.pooler.tokwise.methods.StepPool", "methods": [ { "kind": "function", "name": "StepPool.get_pooling_updates", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StepPool.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.pooler.tokwise.methods.get_tok_pooling_method", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.pooler.tokwise.methods", "names": [ "vllm.model_executor.layers.pooler.tokwise.methods.AllPool", "vllm.model_executor.layers.pooler.tokwise.methods.StepPool", "vllm.model_executor.layers.pooler.tokwise.methods.TokenPoolingMethod", "vllm.model_executor.layers.pooler.tokwise.methods.TokenPoolingMethodOutputItem", "vllm.model_executor.layers.pooler.tokwise.methods.get_tok_pooling_method" ], "n_typable": 19, "n_typed": 16, "n_any": 0, "n_untyped": 3, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 8, "n_classes": 3, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/pooler/tokwise/poolers.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.pooler.tokwise.poolers.pooler_for_token_classify", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "attr", "name": "vllm.model_executor.layers.pooler.tokwise.poolers.TokenPoolerOutput", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.pooler.tokwise.poolers.TokenPooler", "methods": [ { "kind": "function", "name": "TokenPooler.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TokenPooler.get_supported_tasks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TokenPooler.get_pooling_updates", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TokenPooler.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TokenPooler.pooling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TokenPooler.head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 9, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 5, "n_attrs": 2, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.pooler.tokwise.poolers.pooler_for_token_embed", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.model_executor.layers.pooler.tokwise.poolers.TokenPoolingFn", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.pooler.tokwise.poolers.TokenPoolingHeadFn", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.pooler.tokwise.poolers", "names": [ "vllm.model_executor.layers.pooler.tokwise.poolers.TokenPooler", "vllm.model_executor.layers.pooler.tokwise.poolers.TokenPoolerOutput", "vllm.model_executor.layers.pooler.tokwise.poolers.TokenPoolingFn", "vllm.model_executor.layers.pooler.tokwise.poolers.TokenPoolingHeadFn", "vllm.model_executor.layers.pooler.tokwise.poolers.pooler_for_token_classify", "vllm.model_executor.layers.pooler.tokwise.poolers.pooler_for_token_embed" ], "n_typable": 22, "n_typed": 19, "n_any": 0, "n_untyped": 3, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 6, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 5, "n_classes": 1, "n_attrs": 5, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/__init__.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.layers.quantization.QuantizationMethods", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.get_quantization_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.QUANTIZATION_METHODS", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.register_quantization_config", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization", "names": [ "vllm.model_executor.layers.quantization.QUANTIZATION_METHODS", "vllm.model_executor.layers.quantization.QuantizationMethods", "vllm.model_executor.layers.quantization.get_quantization_config", "vllm.model_executor.layers.quantization.register_quantization_config" ], "n_typable": 6, "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 2, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/base_config.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.quantization.base_config.QuantizationConfig", "methods": [ { "kind": "function", "name": "QuantizationConfig.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "QuantizationConfig.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "QuantizationConfig.get_supported_act_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "QuantizationConfig.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "QuantizationConfig.get_config_filenames", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "QuantizationConfig.from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "QuantizationConfig.override_quantization_method", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "QuantizationConfig.get_from_keys", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "QuantizationConfig.get_from_keys_or", "n_typed": 2, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "QuantizationConfig.get_quant_method", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "QuantizationConfig.get_cache_scale", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "QuantizationConfig.apply_vllm_mapper", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "QuantizationConfig.maybe_update_config", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "QuantizationConfig.is_mxfp4_quant", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "QuantizationConfig.packed_modules_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 30, "n_typed": 22, "n_any": 3, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 15, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.base_config.method_has_implemented_embedding", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.base_config.QuantizationMethods", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.base_config.QuantizeMethodBase", "methods": [ { "kind": "function", "name": "QuantizeMethodBase.create_weights", "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "QuantizeMethodBase.apply", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "QuantizeMethodBase.embedding", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "QuantizeMethodBase.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "QuantizeMethodBase.uses_meta_device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 15, "n_typed": 8, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 10, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.base_config", "names": [ "vllm.model_executor.layers.quantization.base_config.QuantizationConfig", "vllm.model_executor.layers.quantization.base_config.QuantizationMethods", "vllm.model_executor.layers.quantization.base_config.QuantizeMethodBase", "vllm.model_executor.layers.quantization.base_config.method_has_implemented_embedding" ], "n_typable": 47, "n_typed": 32, "n_any": 3, "n_untyped": 12, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 18, "n_method_overloads": 18, "n_method_params": 25, "n_classes": 2, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/awq.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.quantization.awq.AWQConfig", "methods": [ { "kind": "function", "name": "AWQConfig.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "AWQConfig.__repr__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AWQConfig.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AWQConfig.get_supported_act_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AWQConfig.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AWQConfig.get_config_filenames", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AWQConfig.from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AWQConfig.get_quant_method", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AWQConfig.apply_vllm_mapper", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AWQConfig.maybe_update_config", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AWQConfig.weight_bits", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AWQConfig.group_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AWQConfig.zero_point", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AWQConfig.modules_to_not_convert", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AWQConfig.pack_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 25, "n_typed": 18, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 10, "n_attrs": 5, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.awq.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.awq.AWQLinearMethod", "methods": [ { "kind": "function", "name": "AWQLinearMethod.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AWQLinearMethod.create_weights", "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "AWQLinearMethod.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AWQLinearMethod.apply", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AWQLinearMethod.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 13, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 12, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.awq", "names": [ "vllm.model_executor.layers.quantization.awq.AWQConfig", "vllm.model_executor.layers.quantization.awq.AWQLinearMethod", "vllm.model_executor.layers.quantization.awq.logger" ], "n_typable": 43, "n_typed": 31, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 22, "n_classes": 2, "n_attrs": 7, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/awq_marlin.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.quantization.awq_marlin.AWQMarlinConfig", "methods": [ { "kind": "function", "name": "AWQMarlinConfig.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "AWQMarlinConfig.__repr__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AWQMarlinConfig.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AWQMarlinConfig.get_supported_act_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AWQMarlinConfig.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AWQMarlinConfig.get_config_filenames", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AWQMarlinConfig.from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AWQMarlinConfig.override_quantization_method", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AWQMarlinConfig.get_quant_method", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AWQMarlinConfig.is_awq_marlin_compatible", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AWQMarlinConfig.apply_vllm_mapper", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AWQMarlinConfig.maybe_update_config", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AWQMarlinConfig.TYPE_MAP", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AWQMarlinConfig.pack_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AWQMarlinConfig.group_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AWQMarlinConfig.zero_point", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AWQMarlinConfig.lm_head_quantized", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AWQMarlinConfig.weight_bits", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AWQMarlinConfig.modules_to_not_convert", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AWQMarlinConfig.full_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AWQMarlinConfig.quant_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 35, "n_typed": 22, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 15, "n_attrs": 9, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.awq_marlin.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.awq_marlin.AWQMarlinLinearMethod", "methods": [ { "kind": "function", "name": "AWQMarlinLinearMethod.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AWQMarlinLinearMethod.create_weights", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "AWQMarlinLinearMethod.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AWQMarlinLinearMethod.apply", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AWQMarlinLinearMethod.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AWQMarlinLinearMethod.quant_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AWQMarlinLinearMethod.input_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 15, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 12, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.awq_marlin.AWQMarlinMoEMethod", "methods": [ { "kind": "function", "name": "AWQMarlinMoEMethod.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AWQMarlinMoEMethod.create_weights", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "AWQMarlinMoEMethod.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AWQMarlinMoEMethod.get_fused_moe_quant_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AWQMarlinMoEMethod.select_gemm_impl", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AWQMarlinMoEMethod.apply", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AWQMarlinMoEMethod.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AWQMarlinMoEMethod.quant_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AWQMarlinMoEMethod.input_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AWQMarlinMoEMethod.use_marlin", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 27, "n_typed": 18, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 17, "n_attrs": 4, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.awq_marlin", "names": [ "vllm.model_executor.layers.quantization.awq_marlin.AWQMarlinConfig", "vllm.model_executor.layers.quantization.awq_marlin.AWQMarlinLinearMethod", "vllm.model_executor.layers.quantization.awq_marlin.AWQMarlinMoEMethod", "vllm.model_executor.layers.quantization.awq_marlin.logger" ], "n_typable": 82, "n_typed": 55, "n_any": 0, "n_untyped": 27, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 22, "n_method_overloads": 22, "n_method_params": 44, "n_classes": 3, "n_attrs": 17, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/awq_triton.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.layers.quantization.awq_triton.AWQ_TRITON_SUPPORTED_GROUP_SIZES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.awq_triton.awq_gemm_kernel", "n_typed": 4, "n_any": 0, "n_untyped": 10, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.awq_triton.awq_dequantize_kernel", "n_typed": 2, "n_any": 0, "n_untyped": 8, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.awq_triton.awq_dequantize_triton", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.awq_triton.awq_gemm_triton", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.awq_triton", "names": [ "vllm.model_executor.layers.quantization.awq_triton.AWQ_TRITON_SUPPORTED_GROUP_SIZES", "vllm.model_executor.layers.quantization.awq_triton.awq_dequantize_kernel", "vllm.model_executor.layers.quantization.awq_triton.awq_dequantize_triton", "vllm.model_executor.layers.quantization.awq_triton.awq_gemm_kernel", "vllm.model_executor.layers.quantization.awq_triton.awq_gemm_triton" ], "n_typable": 39, "n_typed": 21, "n_any": 0, "n_untyped": 18, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 35, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/bitsandbytes.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.quantization.bitsandbytes.BitsAndBytesMoEMethod", "methods": [ { "kind": "function", "name": "BitsAndBytesMoEMethod.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BitsAndBytesMoEMethod.create_weights", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "BitsAndBytesMoEMethod.get_fused_moe_quant_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BitsAndBytesMoEMethod.apply", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "BitsAndBytesMoEMethod._create_weights_4bit", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "BitsAndBytesMoEMethod._create_weights_8bit", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "BitsAndBytesMoEMethod._apply_4bit_dequnt", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BitsAndBytesMoEMethod._apply_8bit_dequant", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BitsAndBytesMoEMethod.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 37, "n_typed": 29, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 28, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.bitsandbytes.is_layer_skipped_bnb", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.bitsandbytes.BitsAndBytesConfig", "methods": [ { "kind": "function", "name": "BitsAndBytesConfig.__init__", "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "BitsAndBytesConfig.__repr__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BitsAndBytesConfig.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BitsAndBytesConfig.get_supported_act_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BitsAndBytesConfig.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BitsAndBytesConfig.get_config_filenames", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BitsAndBytesConfig.from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BitsAndBytesConfig.get_quant_method", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BitsAndBytesConfig.load_in_8bit", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BitsAndBytesConfig.load_in_4bit", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BitsAndBytesConfig.bnb_4bit_compute_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BitsAndBytesConfig.bnb_4bit_quant_storage", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BitsAndBytesConfig.bnb_4bit_quant_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BitsAndBytesConfig.bnb_4bit_use_double_quant", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BitsAndBytesConfig.llm_int8_enable_fp32_cpu_offload", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BitsAndBytesConfig.llm_int8_has_fp16_weight", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BitsAndBytesConfig.llm_int8_skip_modules", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BitsAndBytesConfig.llm_int8_threshold", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 31, "n_typed": 21, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 13, "n_attrs": 10, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.bitsandbytes.BitsAndBytesLinearMethod", "methods": [ { "kind": "function", "name": "BitsAndBytesLinearMethod.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BitsAndBytesLinearMethod.create_weights", "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "BitsAndBytesLinearMethod.apply", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BitsAndBytesLinearMethod._apply_8bit_weight", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BitsAndBytesLinearMethod._apply_4bit_weight", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BitsAndBytesLinearMethod.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 23, "n_typed": 19, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 17, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.bitsandbytes.calculate_quant_ratio", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.bitsandbytes", "names": [ "vllm.model_executor.layers.quantization.bitsandbytes.BitsAndBytesConfig", "vllm.model_executor.layers.quantization.bitsandbytes.BitsAndBytesLinearMethod", "vllm.model_executor.layers.quantization.bitsandbytes.BitsAndBytesMoEMethod", "vllm.model_executor.layers.quantization.bitsandbytes.calculate_quant_ratio", "vllm.model_executor.layers.quantization.bitsandbytes.is_layer_skipped_bnb" ], "n_typable": 96, "n_typed": 71, "n_any": 0, "n_untyped": 25, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 3, "n_methods": 21, "n_method_overloads": 21, "n_method_params": 58, "n_classes": 3, "n_attrs": 12, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/compressed_tensors/compressed_tensors.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.quantization.compressed_tensors.compressed_tensors.CompressedTensorsLinearMethod", "methods": [ { "kind": "function", "name": "CompressedTensorsLinearMethod.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompressedTensorsLinearMethod.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompressedTensorsLinearMethod.create_weights", "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "CompressedTensorsLinearMethod.apply", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CompressedTensorsLinearMethod.quantization_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 12, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 12, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.compressed_tensors.compressed_tensors", "names": [ "vllm.model_executor.layers.quantization.compressed_tensors.compressed_tensors.CompressedTensorsLinearMethod" ], "n_typable": 17, "n_typed": 12, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 12, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/compressed_tensors/compressed_tensors_moe.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.quantization.compressed_tensors.compressed_tensors_moe.CompressedTensorsWNA16MarlinMoEMethod", "methods": [ { "kind": "function", "name": "CompressedTensorsWNA16MarlinMoEMethod.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "CompressedTensorsWNA16MarlinMoEMethod.get_weight_shape", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "CompressedTensorsWNA16MarlinMoEMethod.create_weights", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "CompressedTensorsWNA16MarlinMoEMethod.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompressedTensorsWNA16MarlinMoEMethod.get_fused_moe_quant_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompressedTensorsWNA16MarlinMoEMethod.select_gemm_impl", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CompressedTensorsWNA16MarlinMoEMethod.apply_monolithic", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "CompressedTensorsWNA16MarlinMoEMethod.apply", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [ { "kind": "property", "name": "CompressedTensorsWNA16MarlinMoEMethod.is_monolithic", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "CompressedTensorsWNA16MarlinMoEMethod.weight_quant", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsWNA16MarlinMoEMethod.input_quant", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsWNA16MarlinMoEMethod.num_bits", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsWNA16MarlinMoEMethod.packed_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsWNA16MarlinMoEMethod.strategy", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsWNA16MarlinMoEMethod.group_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsWNA16MarlinMoEMethod.actorder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsWNA16MarlinMoEMethod.quant_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsWNA16MarlinMoEMethod.marlin_input_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsWNA16MarlinMoEMethod.use_flashinfer_mxint4_moe", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsWNA16MarlinMoEMethod.kernel_backend", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 48, "n_typed": 34, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 28, "n_attrs": 11, "n_properties": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.compressed_tensors.compressed_tensors_moe.CompressedTensorsW4A8Int8MoEMethod", "methods": [ { "kind": "function", "name": "CompressedTensorsW4A8Int8MoEMethod.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "CompressedTensorsW4A8Int8MoEMethod.create_weights", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "CompressedTensorsW4A8Int8MoEMethod.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompressedTensorsW4A8Int8MoEMethod.get_fused_moe_quant_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompressedTensorsW4A8Int8MoEMethod.apply_monolithic", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [ { "kind": "property", "name": "CompressedTensorsW4A8Int8MoEMethod.is_monolithic", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "CompressedTensorsW4A8Int8MoEMethod.has_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsW4A8Int8MoEMethod.weight_quant", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsW4A8Int8MoEMethod.input_quant", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsW4A8Int8MoEMethod.group_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsW4A8Int8MoEMethod.static_input_scales", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 26, "n_typed": 18, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 15, "n_attrs": 5, "n_properties": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.compressed_tensors.compressed_tensors_moe.CompressedTensorsMoEMethod", "methods": [ { "kind": "function", "name": "CompressedTensorsMoEMethod.get_moe_method", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.compressed_tensors.compressed_tensors_moe.CompressedTensorsW8A8Int8MoEMethod", "methods": [ { "kind": "function", "name": "CompressedTensorsW8A8Int8MoEMethod.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "CompressedTensorsW8A8Int8MoEMethod.create_weights", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "CompressedTensorsW8A8Int8MoEMethod.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompressedTensorsW8A8Int8MoEMethod.get_fused_moe_quant_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompressedTensorsW8A8Int8MoEMethod.apply", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CompressedTensorsW8A8Int8MoEMethod.weight_quant", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsW8A8Int8MoEMethod.input_quant", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsW8A8Int8MoEMethod.static_input_scales", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 25, "n_typed": 19, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 17, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.compressed_tensors.compressed_tensors_moe.CompressedTensorsW4A4Nvfp4MoEMethod", "methods": [ { "kind": "function", "name": "CompressedTensorsW4A4Nvfp4MoEMethod.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "CompressedTensorsW4A4Nvfp4MoEMethod.create_weights", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "CompressedTensorsW4A4Nvfp4MoEMethod.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompressedTensorsW4A4Nvfp4MoEMethod.maybe_make_prepare_finalize", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompressedTensorsW4A4Nvfp4MoEMethod.get_fused_moe_quant_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompressedTensorsW4A4Nvfp4MoEMethod.apply_monolithic", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "CompressedTensorsW4A4Nvfp4MoEMethod.apply", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CompressedTensorsW4A4Nvfp4MoEMethod.group_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsW4A4Nvfp4MoEMethod.use_global_sf", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 29, "n_typed": 24, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 20, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.compressed_tensors.compressed_tensors_moe.CompressedTensorsWNA16MoEMethod", "methods": [ { "kind": "function", "name": "CompressedTensorsWNA16MoEMethod.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "CompressedTensorsWNA16MoEMethod.create_weights", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "CompressedTensorsWNA16MoEMethod.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompressedTensorsWNA16MoEMethod.get_fused_moe_quant_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompressedTensorsWNA16MoEMethod.select_gemm_impl", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CompressedTensorsWNA16MoEMethod.apply", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [ { "kind": "property", "name": "CompressedTensorsWNA16MoEMethod.supports_eplb", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "CompressedTensorsWNA16MoEMethod.weight_quant", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsWNA16MoEMethod.input_quant", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsWNA16MoEMethod.num_bits", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsWNA16MoEMethod.packed_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsWNA16MoEMethod.strategy", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsWNA16MoEMethod.group_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 32, "n_typed": 23, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 19, "n_attrs": 6, "n_properties": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.compressed_tensors.compressed_tensors_moe.CompressedTensorsW8A8Fp8MoEMethod", "methods": [ { "kind": "function", "name": "CompressedTensorsW8A8Fp8MoEMethod.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "CompressedTensorsW8A8Fp8MoEMethod.create_weights", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "CompressedTensorsW8A8Fp8MoEMethod.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompressedTensorsW8A8Fp8MoEMethod.maybe_make_prepare_finalize", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompressedTensorsW8A8Fp8MoEMethod.get_fused_moe_quant_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompressedTensorsW8A8Fp8MoEMethod.apply_monolithic", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "CompressedTensorsW8A8Fp8MoEMethod.apply", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [ { "kind": "property", "name": "CompressedTensorsW8A8Fp8MoEMethod.supports_eplb", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "CompressedTensorsW8A8Fp8MoEMethod.weight_quant", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsW8A8Fp8MoEMethod.input_quant", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsW8A8Fp8MoEMethod.block_quant", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsW8A8Fp8MoEMethod.static_input_scales", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsW8A8Fp8MoEMethod.weight_block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 34, "n_typed": 26, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 21, "n_attrs": 5, "n_properties": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.compressed_tensors.compressed_tensors_moe", "names": [ "vllm.model_executor.layers.quantization.compressed_tensors.compressed_tensors_moe.CompressedTensorsMoEMethod", "vllm.model_executor.layers.quantization.compressed_tensors.compressed_tensors_moe.CompressedTensorsW4A4Nvfp4MoEMethod", "vllm.model_executor.layers.quantization.compressed_tensors.compressed_tensors_moe.CompressedTensorsW4A8Int8MoEMethod", "vllm.model_executor.layers.quantization.compressed_tensors.compressed_tensors_moe.CompressedTensorsW8A8Fp8MoEMethod", "vllm.model_executor.layers.quantization.compressed_tensors.compressed_tensors_moe.CompressedTensorsW8A8Int8MoEMethod", "vllm.model_executor.layers.quantization.compressed_tensors.compressed_tensors_moe.CompressedTensorsWNA16MarlinMoEMethod", "vllm.model_executor.layers.quantization.compressed_tensors.compressed_tensors_moe.CompressedTensorsWNA16MoEMethod" ], "n_typable": 198, "n_typed": 148, "n_any": 0, "n_untyped": 50, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 39, "n_method_overloads": 39, "n_method_params": 123, "n_classes": 7, "n_attrs": 32, "n_properties": 4, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/compressed_tensors/schemes/compressed_tensors_w8a8_int8.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.quantization.compressed_tensors.schemes.compressed_tensors_w8a8_int8.CompressedTensorsW8A8Int8", "methods": [ { "kind": "function", "name": "CompressedTensorsW8A8Int8.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "CompressedTensorsW8A8Int8.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CompressedTensorsW8A8Int8.create_weights", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "CompressedTensorsW8A8Int8.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompressedTensorsW8A8Int8.apply_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CompressedTensorsW8A8Int8.strategy", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsW8A8Int8.is_static_input_scheme", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsW8A8Int8.input_symmetric", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 15, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 13, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.compressed_tensors.schemes.compressed_tensors_w8a8_int8.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.compressed_tensors.schemes.compressed_tensors_w8a8_int8", "names": [ "vllm.model_executor.layers.quantization.compressed_tensors.schemes.compressed_tensors_w8a8_int8.CompressedTensorsW8A8Int8", "vllm.model_executor.layers.quantization.compressed_tensors.schemes.compressed_tensors_w8a8_int8.logger" ], "n_typable": 22, "n_typed": 15, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 13, "n_classes": 1, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/compressed_tensors/schemes/compressed_tensors_wNa16.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.layers.quantization.compressed_tensors.schemes.compressed_tensors_wNa16.WNA16_SUPPORTED_BITS", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.compressed_tensors.schemes.compressed_tensors_wNa16.CompressedTensorsWNA16", "methods": [ { "kind": "function", "name": "CompressedTensorsWNA16.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "CompressedTensorsWNA16.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CompressedTensorsWNA16.create_weights", "n_typed": 7, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "CompressedTensorsWNA16.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompressedTensorsWNA16.apply_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CompressedTensorsWNA16._kernel_backends_being_used", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsWNA16.pack_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsWNA16.strategy", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsWNA16.symmetric", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsWNA16.group_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsWNA16.has_g_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsWNA16.layer_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsWNA16.quant_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 31, "n_typed": 21, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 18, "n_attrs": 8, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.compressed_tensors.schemes.compressed_tensors_wNa16", "names": [ "vllm.model_executor.layers.quantization.compressed_tensors.schemes.compressed_tensors_wNa16.CompressedTensorsWNA16", "vllm.model_executor.layers.quantization.compressed_tensors.schemes.compressed_tensors_wNa16.WNA16_SUPPORTED_BITS" ], "n_typable": 32, "n_typed": 21, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 18, "n_classes": 1, "n_attrs": 9, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/compressed_tensors/schemes/compressed_tensors_24.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.quantization.compressed_tensors.schemes.compressed_tensors_24.CompressedTensors24", "methods": [ { "kind": "function", "name": "CompressedTensors24.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "CompressedTensors24.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CompressedTensors24.create_weights", "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "CompressedTensors24.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompressedTensors24.apply_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "CompressedTensors24._get_params_dtype", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompressedTensors24._get_quant_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CompressedTensors24._decompress_bitmask_compressed_weight", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CompressedTensors24.quantized", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensors24.weight_quant", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensors24.input_quant", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensors24.do_sparse_decompress", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensors24.model_compressor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensors24.quant_fp8", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 33, "n_typed": 24, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 19, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.compressed_tensors.schemes.compressed_tensors_24", "names": [ "vllm.model_executor.layers.quantization.compressed_tensors.schemes.compressed_tensors_24.CompressedTensors24" ], "n_typable": 33, "n_typed": 24, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 19, "n_classes": 1, "n_attrs": 6, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/compressed_tensors/schemes/compressed_tensors_w4a8_fp8.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.quantization.compressed_tensors.schemes.compressed_tensors_w4a8_fp8.CompressedTensorsW4A8Fp8", "methods": [ { "kind": "function", "name": "CompressedTensorsW4A8Fp8.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "CompressedTensorsW4A8Fp8.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CompressedTensorsW4A8Fp8.create_weights", "n_typed": 7, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "CompressedTensorsW4A8Fp8.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompressedTensorsW4A8Fp8.apply_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CompressedTensorsW4A8Fp8._kernel_backends_being_used", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsW4A8Fp8.pack_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsW4A8Fp8.strategy", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsW4A8Fp8.symmetric", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsW4A8Fp8.group_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsW4A8Fp8.has_g_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsW4A8Fp8.quant_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 29, "n_typed": 20, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 17, "n_attrs": 7, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.compressed_tensors.schemes.compressed_tensors_w4a8_fp8", "names": [ "vllm.model_executor.layers.quantization.compressed_tensors.schemes.compressed_tensors_w4a8_fp8.CompressedTensorsW4A8Fp8" ], "n_typable": 29, "n_typed": 20, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 17, "n_classes": 1, "n_attrs": 7, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/compressed_tensors/schemes/compressed_tensors_w4a8_int.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.quantization.compressed_tensors.schemes.compressed_tensors_w4a8_int.CompressedTensorsW4A8Int", "methods": [ { "kind": "function", "name": "CompressedTensorsW4A8Int.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "CompressedTensorsW4A8Int.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CompressedTensorsW4A8Int.create_weights", "n_typed": 7, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "CompressedTensorsW4A8Int.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompressedTensorsW4A8Int.apply_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CompressedTensorsW4A8Int._kernel_backends_being_used", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsW4A8Int.strategy", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsW4A8Int.group_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsW4A8Int.is_static_input_scheme", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsW4A8Int.input_symmetric", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsW4A8Int.quant_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 28, "n_typed": 20, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 17, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.compressed_tensors.schemes.compressed_tensors_w4a8_int", "names": [ "vllm.model_executor.layers.quantization.compressed_tensors.schemes.compressed_tensors_w4a8_int.CompressedTensorsW4A8Int" ], "n_typable": 28, "n_typed": 20, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 17, "n_classes": 1, "n_attrs": 6, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/compressed_tensors/schemes/compressed_tensors_scheme.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.quantization.compressed_tensors.schemes.compressed_tensors_scheme.CompressedTensorsScheme", "methods": [ { "kind": "function", "name": "CompressedTensorsScheme.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CompressedTensorsScheme.create_weights", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CompressedTensorsScheme.apply_weights", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "CompressedTensorsScheme.process_weights_after_loading", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 10, "n_typed": 5, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 6, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.compressed_tensors.schemes.compressed_tensors_scheme", "names": [ "vllm.model_executor.layers.quantization.compressed_tensors.schemes.compressed_tensors_scheme.CompressedTensorsScheme" ], "n_typable": 10, "n_typed": 5, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 6, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/compressed_tensors/schemes/compressed_tensors_w8a16_fp8.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.quantization.compressed_tensors.schemes.compressed_tensors_w8a16_fp8.CompressedTensorsW8A16Fp8", "methods": [ { "kind": "function", "name": "CompressedTensorsW8A16Fp8.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CompressedTensorsW8A16Fp8.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CompressedTensorsW8A16Fp8.create_weights", "n_typed": 7, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "CompressedTensorsW8A16Fp8.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompressedTensorsW8A16Fp8.apply_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CompressedTensorsW8A16Fp8.weight_quant", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsW8A16Fp8.strategy", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsW8A16Fp8.is_static_input_scheme", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsW8A16Fp8.weight_block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 23, "n_typed": 16, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 14, "n_attrs": 4, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.compressed_tensors.schemes.compressed_tensors_w8a16_fp8", "names": [ "vllm.model_executor.layers.quantization.compressed_tensors.schemes.compressed_tensors_w8a16_fp8.CompressedTensorsW8A16Fp8" ], "n_typable": 23, "n_typed": 16, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 14, "n_classes": 1, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/compressed_tensors/schemes/compressed_tensors_w8a8_fp8.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.quantization.compressed_tensors.schemes.compressed_tensors_w8a8_fp8.CompressedTensorsW8A8Fp8", "methods": [ { "kind": "function", "name": "CompressedTensorsW8A8Fp8.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CompressedTensorsW8A8Fp8.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CompressedTensorsW8A8Fp8.create_weights", "n_typed": 7, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "CompressedTensorsW8A8Fp8.process_weights_after_loading", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompressedTensorsW8A8Fp8.apply_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CompressedTensorsW8A8Fp8.weight_quant", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsW8A8Fp8.strategy", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsW8A8Fp8.out_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsW8A8Fp8.is_static_input_scheme", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsW8A8Fp8.weight_block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsW8A8Fp8.cutlass_block_fp8_supported", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsW8A8Fp8.use_aiter_and_is_supported", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsW8A8Fp8.act_q_group_shape", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsW8A8Fp8.w8a8_block_fp8_linear", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsW8A8Fp8.fp8_linear", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 29, "n_typed": 15, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 14, "n_attrs": 10, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.compressed_tensors.schemes.compressed_tensors_w8a8_fp8", "names": [ "vllm.model_executor.layers.quantization.compressed_tensors.schemes.compressed_tensors_w8a8_fp8.CompressedTensorsW8A8Fp8" ], "n_typable": 29, "n_typed": 15, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 14, "n_classes": 1, "n_attrs": 10, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/compressed_tensors/schemes/compressed_tensors_w4a4_nvfp4.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.quantization.compressed_tensors.schemes.compressed_tensors_w4a4_nvfp4.CompressedTensorsW4A4Fp4", "methods": [ { "kind": "function", "name": "CompressedTensorsW4A4Fp4.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CompressedTensorsW4A4Fp4.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CompressedTensorsW4A4Fp4.create_weights", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "CompressedTensorsW4A4Fp4.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompressedTensorsW4A4Fp4.apply_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CompressedTensorsW4A4Fp4.backend", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsW4A4Fp4.group_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 12, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 10, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.compressed_tensors.schemes.compressed_tensors_w4a4_nvfp4", "names": [ "vllm.model_executor.layers.quantization.compressed_tensors.schemes.compressed_tensors_w4a4_nvfp4.CompressedTensorsW4A4Fp4" ], "n_typable": 17, "n_typed": 12, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 10, "n_classes": 1, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/compressed_tensors/schemes/compressed_tensors_w4a16_nvfp4.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.quantization.compressed_tensors.schemes.compressed_tensors_w4a16_nvfp4.CompressedTensorsW4A16Fp4", "methods": [ { "kind": "function", "name": "CompressedTensorsW4A16Fp4.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CompressedTensorsW4A16Fp4.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CompressedTensorsW4A16Fp4.create_weights", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "CompressedTensorsW4A16Fp4.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompressedTensorsW4A16Fp4.apply_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CompressedTensorsW4A16Fp4.group_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 12, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 10, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.compressed_tensors.schemes.compressed_tensors_w4a16_nvfp4", "names": [ "vllm.model_executor.layers.quantization.compressed_tensors.schemes.compressed_tensors_w4a16_nvfp4.CompressedTensorsW4A16Fp4" ], "n_typable": 16, "n_typed": 12, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 10, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/compressed_tensors/schemes/compressed_tensors_w4a16_mxfp4.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.quantization.compressed_tensors.schemes.compressed_tensors_w4a16_mxfp4.CompressedTensorsW4A16Mxfp4", "methods": [ { "kind": "function", "name": "CompressedTensorsW4A16Mxfp4.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CompressedTensorsW4A16Mxfp4.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CompressedTensorsW4A16Mxfp4.create_weights", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "CompressedTensorsW4A16Mxfp4.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompressedTensorsW4A16Mxfp4.apply_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CompressedTensorsW4A16Mxfp4.group_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 12, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 10, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.compressed_tensors.schemes.compressed_tensors_w4a16_mxfp4", "names": [ "vllm.model_executor.layers.quantization.compressed_tensors.schemes.compressed_tensors_w4a16_mxfp4.CompressedTensorsW4A16Mxfp4" ], "n_typable": 16, "n_typed": 12, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 10, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/compressed_tensors/transform/linear.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.quantization.compressed_tensors.transform.linear.get_schemes_args", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.compressed_tensors.transform.linear.get_linear_transform_schemes", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.compressed_tensors.transform.linear.CompressedTensorsLinearTransformMethod", "methods": [ { "kind": "function", "name": "CompressedTensorsLinearTransformMethod.from_schemes", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "CompressedTensorsLinearTransformMethod.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "CompressedTensorsLinearTransformMethod.create_weights", "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "CompressedTensorsLinearTransformMethod.process_weights_after_loading", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CompressedTensorsLinearTransformMethod.apply", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "CompressedTensorsLinearTransformMethod._validate_tfm_schemes", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CompressedTensorsLinearTransformMethod.quant_method", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsLinearTransformMethod.input_tfms", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsLinearTransformMethod.output_tfms", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsLinearTransformMethod.input_transform", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CompressedTensorsLinearTransformMethod.output_transform", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 30, "n_typed": 21, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 19, "n_attrs": 5, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.compressed_tensors.transform.linear.get_layer_partition_names", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.compressed_tensors.transform.linear", "names": [ "vllm.model_executor.layers.quantization.compressed_tensors.transform.linear.CompressedTensorsLinearTransformMethod", "vllm.model_executor.layers.quantization.compressed_tensors.transform.linear.get_layer_partition_names", "vllm.model_executor.layers.quantization.compressed_tensors.transform.linear.get_linear_transform_schemes", "vllm.model_executor.layers.quantization.compressed_tensors.transform.linear.get_schemes_args" ], "n_typable": 40, "n_typed": 31, "n_any": 0, "n_untyped": 9, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 7, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 19, "n_classes": 1, "n_attrs": 5, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/compressed_tensors/transform/module.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.quantization.compressed_tensors.transform.module.HadamardTransform", "methods": [ { "kind": "function", "name": "HadamardTransform.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "HadamardTransform.process_weights_after_loading", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "HadamardTransform.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "HadamardTransform._get_data_key", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "HadamardTransform._get_weight_size", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "HadamardTransform._validate_input_transforms", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "HadamardTransform.transforms", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "HadamardTransform.weight", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "HadamardTransform.scales", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 23, "n_typed": 20, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 14, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.compressed_tensors.transform.module", "names": [ "vllm.model_executor.layers.quantization.compressed_tensors.transform.module.HadamardTransform" ], "n_typable": 23, "n_typed": 20, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 14, "n_classes": 1, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/compressed_tensors/transform/schemes/linear_qutlass_nvfp4.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.quantization.compressed_tensors.transform.schemes.linear_qutlass_nvfp4.QutlassNvFP4LinearMethod", "methods": [ { "kind": "function", "name": "QutlassNvFP4LinearMethod.create_weights", "n_typed": 0, "n_any": 0, "n_untyped": 8, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "QutlassNvFP4LinearMethod.apply", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 4, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 10, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.compressed_tensors.transform.schemes.linear_qutlass_nvfp4.is_qutlass_fp4_scheme", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.compressed_tensors.transform.schemes.linear_qutlass_nvfp4", "names": [ "vllm.model_executor.layers.quantization.compressed_tensors.transform.schemes.linear_qutlass_nvfp4.QutlassNvFP4LinearMethod", "vllm.model_executor.layers.quantization.compressed_tensors.transform.schemes.linear_qutlass_nvfp4.is_qutlass_fp4_scheme" ], "n_typable": 15, "n_typed": 7, "n_any": 0, "n_untyped": 8, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 10, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/compressed_tensors/transform/utils.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.quantization.compressed_tensors.transform.utils.TransformTuple", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "TransformTuple.scheme_name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TransformTuple.scheme", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TransformTuple.args", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.compressed_tensors.transform.utils", "names": [ "vllm.model_executor.layers.quantization.compressed_tensors.transform.utils.TransformTuple" ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 1, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/compressed_tensors/triton_scaled_mm.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.quantization.compressed_tensors.triton_scaled_mm.triton_scaled_mm", "n_typed": 10, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.compressed_tensors.triton_scaled_mm.scaled_mm_kernel", "n_typed": 6, "n_any": 0, "n_untyped": 16, "n_overloads": 1, "n_typable": 22, "n_params": 21, "n_function_overloads": 1, "n_function_params": 21 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.compressed_tensors.triton_scaled_mm.is_weak_contiguous", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.compressed_tensors.triton_scaled_mm", "names": [ "vllm.model_executor.layers.quantization.compressed_tensors.triton_scaled_mm.is_weak_contiguous", "vllm.model_executor.layers.quantization.compressed_tensors.triton_scaled_mm.scaled_mm_kernel", "vllm.model_executor.layers.quantization.compressed_tensors.triton_scaled_mm.triton_scaled_mm" ], "n_typable": 35, "n_typed": 17, "n_any": 0, "n_untyped": 18, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 32, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/compressed_tensors/utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.quantization.compressed_tensors.utils.find_matched_target", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.compressed_tensors.utils.should_ignore_layer", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.compressed_tensors.utils.check_equal_or_regex_match", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.compressed_tensors.utils.is_activation_quantization_format", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.compressed_tensors.utils", "names": [ "vllm.model_executor.layers.quantization.compressed_tensors.utils.check_equal_or_regex_match", "vllm.model_executor.layers.quantization.compressed_tensors.utils.find_matched_target", "vllm.model_executor.layers.quantization.compressed_tensors.utils.is_activation_quantization_format", "vllm.model_executor.layers.quantization.compressed_tensors.utils.should_ignore_layer" ], "n_typable": 14, "n_typed": 14, "n_any": 0, "n_untyped": 0, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 10, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/cpu_wna16.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.quantization.cpu_wna16.CPUAWQConfig", "methods": [ { "kind": "function", "name": "CPUAWQConfig.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "CPUAWQConfig.__repr__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CPUAWQConfig.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CPUAWQConfig.get_supported_act_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CPUAWQConfig.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CPUAWQConfig.get_config_filenames", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CPUAWQConfig.from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CPUAWQConfig.override_quantization_method", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CPUAWQConfig.get_quant_method", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CPUAWQConfig.apply_vllm_mapper", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CPUAWQConfig.maybe_update_config", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CPUAWQConfig.pack_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CPUAWQConfig.group_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CPUAWQConfig.zero_point", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CPUAWQConfig.lm_head_quantized", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CPUAWQConfig.weight_bits", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CPUAWQConfig.modules_to_not_convert", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CPUAWQConfig.full_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 32, "n_typed": 21, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 14, "n_attrs": 7, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.cpu_wna16.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.cpu_wna16.CPUAWQLinearMethod", "methods": [ { "kind": "function", "name": "CPUAWQLinearMethod.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CPUAWQLinearMethod.create_weights", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "CPUAWQLinearMethod.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CPUAWQLinearMethod.apply", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CPUAWQLinearMethod.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 15, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 12, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.cpu_wna16", "names": [ "vllm.model_executor.layers.quantization.cpu_wna16.CPUAWQConfig", "vllm.model_executor.layers.quantization.cpu_wna16.CPUAWQLinearMethod", "vllm.model_executor.layers.quantization.cpu_wna16.logger" ], "n_typable": 50, "n_typed": 36, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 26, "n_classes": 2, "n_attrs": 9, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/experts_int8.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.quantization.experts_int8.quantize_in_place_and_get_scales", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.experts_int8.ExpertsInt8Config", "methods": [ { "kind": "function", "name": "ExpertsInt8Config.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ExpertsInt8Config.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ExpertsInt8Config.get_supported_act_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ExpertsInt8Config.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ExpertsInt8Config.get_config_filenames", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ExpertsInt8Config.from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ExpertsInt8Config.get_quant_method", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 10, "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.experts_int8.ExpertsInt8MoEMethod", "methods": [ { "kind": "function", "name": "ExpertsInt8MoEMethod.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ExpertsInt8MoEMethod.create_weights", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "ExpertsInt8MoEMethod.get_fused_moe_quant_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ExpertsInt8MoEMethod.apply", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "ExpertsInt8MoEMethod.quantizing_weight_loader", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ExpertsInt8MoEMethod.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 15, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 16, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.experts_int8", "names": [ "vllm.model_executor.layers.quantization.experts_int8.ExpertsInt8Config", "vllm.model_executor.layers.quantization.experts_int8.ExpertsInt8MoEMethod", "vllm.model_executor.layers.quantization.experts_int8.quantize_in_place_and_get_scales" ], "n_typable": 34, "n_typed": 27, "n_any": 0, "n_untyped": 7, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 19, "n_classes": 2, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/fbgemm_fp8.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.quantization.fbgemm_fp8.FBGEMMFp8LinearMethod", "methods": [ { "kind": "function", "name": "FBGEMMFp8LinearMethod.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FBGEMMFp8LinearMethod.create_weights", "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "FBGEMMFp8LinearMethod.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FBGEMMFp8LinearMethod.apply", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FBGEMMFp8LinearMethod.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FBGEMMFp8LinearMethod.out_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FBGEMMFp8LinearMethod.fp8_linear", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 13, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 12, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.fbgemm_fp8.FBGEMMFp8Config", "methods": [ { "kind": "function", "name": "FBGEMMFp8Config.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FBGEMMFp8Config.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FBGEMMFp8Config.get_supported_act_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FBGEMMFp8Config.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FBGEMMFp8Config.get_config_filenames", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FBGEMMFp8Config.from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FBGEMMFp8Config.get_quant_method", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FBGEMMFp8Config.ignore_list", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FBGEMMFp8Config.input_scale_ub", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FBGEMMFp8Config.use_marlin", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 11, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 5, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.fbgemm_fp8.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.fbgemm_fp8", "names": [ "vllm.model_executor.layers.quantization.fbgemm_fp8.FBGEMMFp8Config", "vllm.model_executor.layers.quantization.fbgemm_fp8.FBGEMMFp8LinearMethod", "vllm.model_executor.layers.quantization.fbgemm_fp8.logger" ], "n_typable": 35, "n_typed": 24, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 17, "n_classes": 2, "n_attrs": 7, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/fp8.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.quantization.fp8.Fp8MoEMethod", "methods": [ { "kind": "function", "name": "Fp8MoEMethod.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Fp8MoEMethod.create_weights", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Fp8MoEMethod._setup_kernel", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "Fp8MoEMethod.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Fp8MoEMethod.maybe_make_prepare_finalize", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Fp8MoEMethod.get_fused_moe_quant_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Fp8MoEMethod.apply_monolithic", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Fp8MoEMethod.apply", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [ { "kind": "property", "name": "Fp8MoEMethod.supports_eplb", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "Fp8MoEMethod.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Fp8MoEMethod.weight_block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Fp8MoEMethod.block_quant", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Fp8MoEMethod.weight_scale_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 39, "n_typed": 33, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 26, "n_attrs": 4, "n_properties": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.fp8.ACTIVATION_SCHEMES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.fp8.Fp8Config", "methods": [ { "kind": "function", "name": "Fp8Config.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Fp8Config.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Fp8Config.get_supported_act_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Fp8Config.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Fp8Config.get_config_filenames", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Fp8Config.apply_vllm_mapper", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Fp8Config.from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Fp8Config.get_quant_method", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Fp8Config.get_cache_scale", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Fp8Config.is_checkpoint_fp8_serialized", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Fp8Config.activation_scheme", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Fp8Config.ignored_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Fp8Config.weight_block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 17, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 9, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.fp8.Fp8OnlineLinearMethod", "methods": [ { "kind": "function", "name": "Fp8OnlineLinearMethod.create_weights", "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "Fp8OnlineLinearMethod.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Fp8OnlineLinearMethod.uses_meta_device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 11, "n_typed": 9, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.fp8.CopyNumelCounter", "methods": [ { "kind": "function", "name": "CopyNumelCounter.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CopyNumelCounter.__torch_dispatch__", "n_typed": 0, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CopyNumelCounter.copied_numel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 0, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.fp8.Fp8LinearMethod", "methods": [ { "kind": "function", "name": "Fp8LinearMethod.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Fp8LinearMethod.create_weights", "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "Fp8LinearMethod.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Fp8LinearMethod.apply", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Fp8LinearMethod.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Fp8LinearMethod.cutlass_block_fp8_supported", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Fp8LinearMethod.out_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Fp8LinearMethod.marlin_input_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Fp8LinearMethod.use_marlin", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Fp8LinearMethod.use_aiter_and_is_supported", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Fp8LinearMethod.use_deep_gemm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Fp8LinearMethod.weight_block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Fp8LinearMethod.block_quant", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Fp8LinearMethod.act_q_static", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Fp8LinearMethod.w8a8_block_fp8_linear", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Fp8LinearMethod.fp8_linear", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 28, "n_typed": 13, "n_any": 0, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 12, "n_attrs": 12, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.fp8.Fp8OnlineMoEMethod", "methods": [ { "kind": "function", "name": "Fp8OnlineMoEMethod.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Fp8OnlineMoEMethod.create_weights", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Fp8OnlineMoEMethod.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Fp8OnlineMoEMethod.uses_meta_device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 13, "n_typed": 10, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.fp8.Fp8KVCacheMethod", "methods": [ { "kind": "function", "name": "Fp8KVCacheMethod.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.fp8.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.fp8", "names": [ "vllm.model_executor.layers.quantization.fp8.ACTIVATION_SCHEMES", "vllm.model_executor.layers.quantization.fp8.CopyNumelCounter", "vllm.model_executor.layers.quantization.fp8.Fp8Config", "vllm.model_executor.layers.quantization.fp8.Fp8KVCacheMethod", "vllm.model_executor.layers.quantization.fp8.Fp8LinearMethod", "vllm.model_executor.layers.quantization.fp8.Fp8MoEMethod", "vllm.model_executor.layers.quantization.fp8.Fp8OnlineLinearMethod", "vllm.model_executor.layers.quantization.fp8.Fp8OnlineMoEMethod", "vllm.model_executor.layers.quantization.fp8.logger" ], "n_typable": 123, "n_typed": 83, "n_any": 0, "n_untyped": 40, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 29, "n_method_overloads": 29, "n_method_params": 69, "n_classes": 7, "n_attrs": 25, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/fp_quant.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.quantization.fp_quant.quantized_forward", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.fp_quant.fused_quantize_mx", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.fp_quant.fused_quantize_nv", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.fp_quant.FPQuantConfig", "methods": [ { "kind": "function", "name": "FPQuantConfig.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "FPQuantConfig.__repr__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FPQuantConfig.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FPQuantConfig.get_supported_act_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FPQuantConfig.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FPQuantConfig.get_config_filenames", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FPQuantConfig.from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FPQuantConfig.get_quant_method", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FPQuantConfig.hadamard_group_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FPQuantConfig.forward_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FPQuantConfig.forward_method", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FPQuantConfig.pseudoquantization", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FPQuantConfig.modules_to_not_convert", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 16, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 8, "n_attrs": 5, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.fp_quant.fused_quantize_mx_fake", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.fp_quant.matmul_nvf4_bf16", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.fp_quant.matmul_mxf4_bf16_fake", "n_typed": 0, "n_any": 0, "n_untyped": 6, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.fp_quant.matmul_nvf4_bf16_fake", "n_typed": 0, "n_any": 0, "n_untyped": 6, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.fp_quant.FPQuantLinearMethod", "methods": [ { "kind": "function", "name": "FPQuantLinearMethod.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FPQuantLinearMethod.create_weights", "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "FPQuantLinearMethod.apply", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FPQuantLinearMethod.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 11, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 11, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.fp_quant.matmul_mxf4_bf16", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.fp_quant.fused_quantize_nv_fake", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.fp_quant", "names": [ "vllm.model_executor.layers.quantization.fp_quant.FPQuantConfig", "vllm.model_executor.layers.quantization.fp_quant.FPQuantLinearMethod", "vllm.model_executor.layers.quantization.fp_quant.fused_quantize_mx", "vllm.model_executor.layers.quantization.fp_quant.fused_quantize_mx_fake", "vllm.model_executor.layers.quantization.fp_quant.fused_quantize_nv", "vllm.model_executor.layers.quantization.fp_quant.fused_quantize_nv_fake", "vllm.model_executor.layers.quantization.fp_quant.matmul_mxf4_bf16", "vllm.model_executor.layers.quantization.fp_quant.matmul_mxf4_bf16_fake", "vllm.model_executor.layers.quantization.fp_quant.matmul_nvf4_bf16", "vllm.model_executor.layers.quantization.fp_quant.matmul_nvf4_bf16_fake", "vllm.model_executor.layers.quantization.fp_quant.quantized_forward" ], "n_typable": 86, "n_typed": 57, "n_any": 0, "n_untyped": 29, "n_functions": 9, "n_function_overloads": 9, "n_function_params": 41, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 19, "n_classes": 2, "n_attrs": 6, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/gguf.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.layers.quantization.gguf.STANDARD_QUANT_TYPES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.gguf.is_layer_skipped_gguf", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.gguf.GGUFMoEMethod", "methods": [ { "kind": "function", "name": "GGUFMoEMethod.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GGUFMoEMethod.create_weights", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "GGUFMoEMethod.get_fused_moe_quant_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GGUFMoEMethod.apply", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GGUFMoEMethod.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 15, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 14, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.gguf.DEQUANT_TYPES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.gguf.GGUFUninitializedParameter", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "GGUFUninitializedParameter.cls_to_become", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GGUFUninitializedParameter.data_container", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.gguf.IMATRIX_QUANT_TYPES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.gguf.KQUANT_TYPES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.gguf.UNQUANTIZED_TYPES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.gguf.GGUFConfig", "methods": [ { "kind": "function", "name": "GGUFConfig.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GGUFConfig.__repr__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GGUFConfig.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GGUFConfig.get_supported_act_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GGUFConfig.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GGUFConfig.get_config_filenames", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GGUFConfig.from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GGUFConfig.get_quant_method", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GGUFConfig.apply_vllm_mapper", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GGUFConfig.unquantized_modules", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 13, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 5, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.gguf.MMQ_QUANT_TYPES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.gguf.GGUFEmbeddingMethod", "methods": [ { "kind": "function", "name": "GGUFEmbeddingMethod.embedding", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.gguf.GGUFLinearMethod", "methods": [ { "kind": "function", "name": "GGUFLinearMethod.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GGUFLinearMethod.create_weights", "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "GGUFLinearMethod.process_weights_after_loading", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GGUFLinearMethod._create_padded_weight_param", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GGUFLinearMethod.apply", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GGUFLinearMethod.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 13, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 13, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.gguf.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.gguf.MMVQ_QUANT_TYPES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.gguf", "names": [ "vllm.model_executor.layers.quantization.gguf.DEQUANT_TYPES", "vllm.model_executor.layers.quantization.gguf.GGUFConfig", "vllm.model_executor.layers.quantization.gguf.GGUFEmbeddingMethod", "vllm.model_executor.layers.quantization.gguf.GGUFLinearMethod", "vllm.model_executor.layers.quantization.gguf.GGUFMoEMethod", "vllm.model_executor.layers.quantization.gguf.GGUFUninitializedParameter", "vllm.model_executor.layers.quantization.gguf.IMATRIX_QUANT_TYPES", "vllm.model_executor.layers.quantization.gguf.KQUANT_TYPES", "vllm.model_executor.layers.quantization.gguf.MMQ_QUANT_TYPES", "vllm.model_executor.layers.quantization.gguf.MMVQ_QUANT_TYPES", "vllm.model_executor.layers.quantization.gguf.STANDARD_QUANT_TYPES", "vllm.model_executor.layers.quantization.gguf.UNQUANTIZED_TYPES", "vllm.model_executor.layers.quantization.gguf.is_layer_skipped_gguf", "vllm.model_executor.layers.quantization.gguf.logger" ], "n_typable": 62, "n_typed": 48, "n_any": 0, "n_untyped": 14, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 3, "n_methods": 19, "n_method_overloads": 19, "n_method_params": 34, "n_classes": 5, "n_attrs": 13, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/gptq.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.quantization.gptq.GPTQLinearMethod", "methods": [ { "kind": "function", "name": "GPTQLinearMethod.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPTQLinearMethod.create_weights", "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "GPTQLinearMethod.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPTQLinearMethod.apply", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GPTQLinearMethod.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTQLinearMethod.use_v2_format", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 13, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 12, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.gptq.QuantizationMethods", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.gptq.GPTQConfig", "methods": [ { "kind": "function", "name": "GPTQConfig.__init__", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "GPTQConfig.__repr__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPTQConfig.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPTQConfig.get_supported_act_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPTQConfig.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPTQConfig.get_config_filenames", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPTQConfig.from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPTQConfig.get_quant_method", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GPTQConfig.apply_vllm_mapper", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPTQConfig.maybe_update_config", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GPTQConfig.dynamic", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTQConfig.weight_bits", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTQConfig.group_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTQConfig.desc_act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTQConfig.lm_head_quantized", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTQConfig.pack_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTQConfig.modules_in_block_to_quantize", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTQConfig.autoround_version", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTQConfig.checkpoint_format", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 33, "n_typed": 22, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 14, "n_attrs": 9, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.gptq.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.gptq.ExllamaState", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ExllamaState.UNUSED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ExllamaState.UNINITIALIZED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ExllamaState.READY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.gptq", "names": [ "vllm.model_executor.layers.quantization.gptq.ExllamaState", "vllm.model_executor.layers.quantization.gptq.GPTQConfig", "vllm.model_executor.layers.quantization.gptq.GPTQLinearMethod", "vllm.model_executor.layers.quantization.gptq.QuantizationMethods", "vllm.model_executor.layers.quantization.gptq.logger" ], "n_typable": 52, "n_typed": 35, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 26, "n_classes": 3, "n_attrs": 16, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/gptq_marlin.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.quantization.gptq_marlin.GPTQMarlinMoEMethod", "methods": [ { "kind": "function", "name": "GPTQMarlinMoEMethod.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GPTQMarlinMoEMethod.create_weights", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "GPTQMarlinMoEMethod.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPTQMarlinMoEMethod.get_fused_moe_quant_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPTQMarlinMoEMethod.select_gemm_impl", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GPTQMarlinMoEMethod.apply", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GPTQMarlinMoEMethod.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTQMarlinMoEMethod.input_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTQMarlinMoEMethod.use_marlin", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTQMarlinMoEMethod.quant_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 27, "n_typed": 19, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 17, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.gptq_marlin.GPTQMarlinLinearMethod", "methods": [ { "kind": "function", "name": "GPTQMarlinLinearMethod.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPTQMarlinLinearMethod.create_weights", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "GPTQMarlinLinearMethod.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPTQMarlinLinearMethod.apply", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GPTQMarlinLinearMethod._kernel_backends_being_used", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GPTQMarlinLinearMethod.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTQMarlinLinearMethod.input_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTQMarlinLinearMethod.quant_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 16, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 12, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.gptq_marlin.GPTQMarlinConfig", "methods": [ { "kind": "function", "name": "GPTQMarlinConfig.__init__", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "GPTQMarlinConfig.__repr__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPTQMarlinConfig.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPTQMarlinConfig.get_supported_act_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPTQMarlinConfig.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPTQMarlinConfig.get_config_filenames", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPTQMarlinConfig.from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPTQMarlinConfig.override_quantization_method", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GPTQMarlinConfig.get_quant_method", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GPTQMarlinConfig.is_gptq_marlin_compatible", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPTQMarlinConfig.apply_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPTQMarlinConfig.maybe_update_config", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GPTQMarlinConfig.TYPE_MAP", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GPTQMarlinConfig.dynamic", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTQMarlinConfig.weight_bits", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTQMarlinConfig.is_sym", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTQMarlinConfig.pack_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTQMarlinConfig.group_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTQMarlinConfig.desc_act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTQMarlinConfig.lm_head_quantized", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTQMarlinConfig.full_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTQMarlinConfig.quant_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTQMarlinConfig.modules_in_block_to_quantize", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTQMarlinConfig.autoround_version", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 40, "n_typed": 23, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 17, "n_attrs": 12, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.gptq_marlin.get_moe_quant_method", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.gptq_marlin.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.gptq_marlin", "names": [ "vllm.model_executor.layers.quantization.gptq_marlin.GPTQMarlinConfig", "vllm.model_executor.layers.quantization.gptq_marlin.GPTQMarlinLinearMethod", "vllm.model_executor.layers.quantization.gptq_marlin.GPTQMarlinMoEMethod", "vllm.model_executor.layers.quantization.gptq_marlin.get_moe_quant_method", "vllm.model_executor.layers.quantization.gptq_marlin.logger" ], "n_typable": 93, "n_typed": 62, "n_any": 0, "n_untyped": 31, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 4, "n_methods": 22, "n_method_overloads": 22, "n_method_params": 46, "n_classes": 3, "n_attrs": 21, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/inc.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.layers.quantization.inc.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.inc.INCConfig", "methods": [ { "kind": "function", "name": "INCConfig.__init__", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "INCConfig.__repr__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "INCConfig.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "INCConfig.get_supported_act_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "INCConfig.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "INCConfig.get_config_filenames", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "INCConfig.from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "INCConfig.get_layer_config", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "INCConfig.check_quantized", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "INCConfig.apply_vllm_mapper", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "INCConfig.apply_awq_quant_layer", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "INCConfig.apply_gptq_quant_layer", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "INCConfig.apply_ipex_quant_layer", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "INCConfig.get_quant_method", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "INCConfig.override_quantization_method", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "INCConfig.SUPPORTED_BITS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "INCConfig.SUPPORTED_DTYPES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "INCConfig.SUPPORTED_FORMATS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "INCConfig.SUPPORTED_BACKENDS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "INCConfig.weight_bits", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "INCConfig.group_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "INCConfig.sym", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "INCConfig.packing_format", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "INCConfig.block_name_to_quantize", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "INCConfig.extra_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "INCConfig.data_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "INCConfig.backend", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "INCConfig.pack_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 49, "n_typed": 28, "n_any": 0, "n_untyped": 21, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 25, "n_attrs": 13, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.inc", "names": [ "vllm.model_executor.layers.quantization.inc.INCConfig", "vllm.model_executor.layers.quantization.inc.logger" ], "n_typable": 50, "n_typed": 28, "n_any": 0, "n_untyped": 22, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 25, "n_classes": 1, "n_attrs": 14, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/input_quant_fp8.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.quantization.input_quant_fp8.QuantFP8", "methods": [ { "kind": "function", "name": "QuantFP8.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "QuantFP8.forward_cuda", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "QuantFP8.forward_hip", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "QuantFP8.forward_native", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "QuantFP8._quantize_group_native", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "QuantFP8.static", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuantFP8.group_shape", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuantFP8.use_per_token_if_dynamic", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuantFP8.num_token_padding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuantFP8.column_major_scales", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuantFP8.tma_aligned_scales", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuantFP8.use_ue8m0", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuantFP8.use_deep_gemm_supported", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuantFP8.use_aiter", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuantFP8.is_group_quant", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuantFP8.group_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 36, "n_typed": 23, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 20, "n_attrs": 11, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.input_quant_fp8", "names": [ "vllm.model_executor.layers.quantization.input_quant_fp8.QuantFP8" ], "n_typable": 36, "n_typed": 23, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 20, "n_classes": 1, "n_attrs": 11, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/kv_cache.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.layers.quantization.kv_cache.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.kv_cache.BaseKVCacheMethod", "methods": [ { "kind": "function", "name": "BaseKVCacheMethod.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseKVCacheMethod.create_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseKVCacheMethod.apply", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseKVCacheMethod.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BaseKVCacheMethod.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 6, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 4, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.kv_cache", "names": [ "vllm.model_executor.layers.quantization.kv_cache.BaseKVCacheMethod", "vllm.model_executor.layers.quantization.kv_cache.logger" ], "n_typable": 10, "n_typed": 6, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 4, "n_classes": 1, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/modelopt.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.layers.quantization.modelopt.KV_CACHE_QUANT_ALGOS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.modelopt.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.modelopt.ModelOptFp8PcPtLinearMethod", "methods": [ { "kind": "function", "name": "ModelOptFp8PcPtLinearMethod.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModelOptFp8PcPtLinearMethod.create_weights", "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "ModelOptFp8PcPtLinearMethod.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModelOptFp8PcPtLinearMethod.apply", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ModelOptFp8PcPtLinearMethod.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModelOptFp8PcPtLinearMethod.fp8_linear", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 14, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 12, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.modelopt.ModelOptMxFp8LinearMethod", "methods": [ { "kind": "function", "name": "ModelOptMxFp8LinearMethod.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModelOptMxFp8LinearMethod.create_weights", "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "ModelOptMxFp8LinearMethod._process_weights_after_loading_scale_2d", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModelOptMxFp8LinearMethod._process_weights_after_loading_scale_1d", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModelOptMxFp8LinearMethod.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModelOptMxFp8LinearMethod.apply", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ModelOptMxFp8LinearMethod.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModelOptMxFp8LinearMethod.backend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelOptMxFp8LinearMethod.mxfp8_linear_op", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 23, "n_typed": 19, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 14, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.modelopt.ModelOptMixedPrecisionConfig", "methods": [ { "kind": "function", "name": "ModelOptMixedPrecisionConfig.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "ModelOptMixedPrecisionConfig.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelOptMixedPrecisionConfig.get_supported_act_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelOptMixedPrecisionConfig.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelOptMixedPrecisionConfig.override_quantization_method", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ModelOptMixedPrecisionConfig._from_config", "n_typed": 6, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "ModelOptMixedPrecisionConfig._resolve_quant_algo", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModelOptMixedPrecisionConfig.get_quant_method", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ModelOptMixedPrecisionConfig.apply_vllm_mapper", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ModelOptMixedPrecisionConfig.kv_cache_quant_method", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModelOptMixedPrecisionConfig.quantized_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModelOptMixedPrecisionConfig.fp8_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModelOptMixedPrecisionConfig.nvfp4_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 30, "n_typed": 22, "n_any": 1, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 17, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.modelopt.ModelOptQuantConfigBase", "methods": [ { "kind": "function", "name": "ModelOptQuantConfigBase.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModelOptQuantConfigBase.is_layer_excluded", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModelOptQuantConfigBase.get_quant_method", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ModelOptQuantConfigBase.apply_vllm_mapper", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModelOptQuantConfigBase._extract_modelopt_quant_algo", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModelOptQuantConfigBase.get_config_filenames", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelOptQuantConfigBase._from_config", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "ModelOptQuantConfigBase.from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ModelOptQuantConfigBase.LinearMethodCls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelOptQuantConfigBase.FusedMoEMethodCls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelOptQuantConfigBase.KVCacheMethodCls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelOptQuantConfigBase.exclude_modules", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 24, "n_typed": 22, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 12, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.modelopt.ModelOptFp8PbWoLinearMethod", "methods": [ { "kind": "function", "name": "ModelOptFp8PbWoLinearMethod.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModelOptFp8PbWoLinearMethod.create_weights", "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "ModelOptFp8PbWoLinearMethod.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModelOptFp8PbWoLinearMethod.apply", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ModelOptFp8PbWoLinearMethod._WEIGHT_BLOCK_SIZE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModelOptFp8PbWoLinearMethod.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModelOptFp8PbWoLinearMethod.weight_block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModelOptFp8PbWoLinearMethod.w8a8_block_fp8_linear", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 15, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 12, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.modelopt.ModelOptFp8MoEMethod", "methods": [ { "kind": "function", "name": "ModelOptFp8MoEMethod.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ModelOptFp8MoEMethod.maybe_make_prepare_finalize", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModelOptFp8MoEMethod.select_gemm_impl", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ModelOptFp8MoEMethod.create_weights", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "ModelOptFp8MoEMethod._setup_kernel", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "ModelOptFp8MoEMethod.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModelOptFp8MoEMethod.get_fused_moe_quant_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModelOptFp8MoEMethod.apply_monolithic", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ModelOptFp8MoEMethod.apply", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ModelOptFp8MoEMethod.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 38, "n_typed": 34, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 28, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.modelopt.ModelOptNvFp4Config", "methods": [ { "kind": "function", "name": "ModelOptNvFp4Config.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ModelOptNvFp4Config.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelOptNvFp4Config.get_supported_act_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelOptNvFp4Config.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelOptNvFp4Config.override_quantization_method", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ModelOptNvFp4Config._from_config", "n_typed": 6, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ModelOptNvFp4Config.is_checkpoint_nvfp4_serialized", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModelOptNvFp4Config.group_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModelOptNvFp4Config.kv_cache_quant_algo", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 15, "n_any": 1, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 12, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.modelopt.ModelOptNvFp4LinearMethod", "methods": [ { "kind": "function", "name": "ModelOptNvFp4LinearMethod.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModelOptNvFp4LinearMethod.create_weights", "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "ModelOptNvFp4LinearMethod.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModelOptNvFp4LinearMethod.apply", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ModelOptNvFp4LinearMethod.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModelOptNvFp4LinearMethod.marlin_input_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModelOptNvFp4LinearMethod.backend", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 14, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 12, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.modelopt.ModelOptMxFp8Config", "methods": [ { "kind": "function", "name": "ModelOptMxFp8Config.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ModelOptMxFp8Config.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelOptMxFp8Config.get_supported_act_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelOptMxFp8Config.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelOptMxFp8Config.get_quant_method", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ModelOptMxFp8Config.override_quantization_method", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ModelOptMxFp8Config._from_config", "n_typed": 5, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ModelOptMxFp8Config.is_checkpoint_mxfp8_serialized", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModelOptMxFp8Config.kv_cache_quant_algo", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 16, "n_any": 1, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 12, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.modelopt.ModelOptFp8KVCacheMethod", "methods": [ { "kind": "function", "name": "ModelOptFp8KVCacheMethod.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.modelopt.QUANT_ALGOS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.modelopt.ModelOptFp8Config", "methods": [ { "kind": "function", "name": "ModelOptFp8Config.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ModelOptFp8Config.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelOptFp8Config.get_supported_act_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelOptFp8Config.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelOptFp8Config.override_quantization_method", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ModelOptFp8Config._from_config", "n_typed": 5, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ModelOptFp8Config.quant_method", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModelOptFp8Config.is_checkpoint_fp8_serialized", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModelOptFp8Config.kv_cache_quant_method", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 14, "n_any": 1, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 11, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.modelopt.ModelOptFp8LinearMethod", "methods": [ { "kind": "function", "name": "ModelOptFp8LinearMethod.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModelOptFp8LinearMethod.create_weights", "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "ModelOptFp8LinearMethod.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModelOptFp8LinearMethod.apply", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ModelOptFp8LinearMethod.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModelOptFp8LinearMethod.fp8_linear", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 14, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 12, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.modelopt.ModelOptNvFp4FusedMoE", "methods": [ { "kind": "function", "name": "ModelOptNvFp4FusedMoE.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ModelOptNvFp4FusedMoE.maybe_make_prepare_finalize", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModelOptNvFp4FusedMoE.uses_weight_scale_2_pattern", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelOptNvFp4FusedMoE.create_weights", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "ModelOptNvFp4FusedMoE.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModelOptNvFp4FusedMoE.get_fused_moe_quant_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModelOptNvFp4FusedMoE.apply_monolithic", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ModelOptNvFp4FusedMoE.apply", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [ { "kind": "property", "name": "ModelOptNvFp4FusedMoE.supports_eplb", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "ModelOptNvFp4FusedMoE.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModelOptNvFp4FusedMoE.use_global_sf", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 30, "n_typed": 26, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 19, "n_attrs": 2, "n_properties": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.modelopt", "names": [ "vllm.model_executor.layers.quantization.modelopt.KV_CACHE_QUANT_ALGOS", "vllm.model_executor.layers.quantization.modelopt.ModelOptFp8Config", "vllm.model_executor.layers.quantization.modelopt.ModelOptFp8KVCacheMethod", "vllm.model_executor.layers.quantization.modelopt.ModelOptFp8LinearMethod", "vllm.model_executor.layers.quantization.modelopt.ModelOptFp8MoEMethod", "vllm.model_executor.layers.quantization.modelopt.ModelOptFp8PbWoLinearMethod", "vllm.model_executor.layers.quantization.modelopt.ModelOptFp8PcPtLinearMethod", "vllm.model_executor.layers.quantization.modelopt.ModelOptMixedPrecisionConfig", "vllm.model_executor.layers.quantization.modelopt.ModelOptMxFp8Config", "vllm.model_executor.layers.quantization.modelopt.ModelOptMxFp8LinearMethod", "vllm.model_executor.layers.quantization.modelopt.ModelOptNvFp4Config", "vllm.model_executor.layers.quantization.modelopt.ModelOptNvFp4FusedMoE", "vllm.model_executor.layers.quantization.modelopt.ModelOptNvFp4LinearMethod", "vllm.model_executor.layers.quantization.modelopt.ModelOptQuantConfigBase", "vllm.model_executor.layers.quantization.modelopt.QUANT_ALGOS", "vllm.model_executor.layers.quantization.modelopt.logger" ], "n_typable": 285, "n_typed": 226, "n_any": 4, "n_untyped": 55, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 76, "n_method_overloads": 76, "n_method_params": 174, "n_classes": 13, "n_attrs": 36, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/moe_wna16.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.quantization.moe_wna16.MoeWNA16Config", "methods": [ { "kind": "function", "name": "MoeWNA16Config.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "MoeWNA16Config.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoeWNA16Config.get_supported_act_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoeWNA16Config.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoeWNA16Config.get_config_filenames", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoeWNA16Config.from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MoeWNA16Config.override_quantization_method", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MoeWNA16Config.is_moe_wna16_compatible", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MoeWNA16Config.get_quant_method", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MoeWNA16Config.weight_bits", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoeWNA16Config.group_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoeWNA16Config.has_zp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoeWNA16Config.bit8_pack_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoeWNA16Config.lm_head_quantized", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoeWNA16Config.linear_quant_method", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoeWNA16Config.full_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoeWNA16Config.use_marlin", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoeWNA16Config.modules_to_not_convert", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 31, "n_typed": 19, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 13, "n_attrs": 9, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.moe_wna16.is_layer_skipped_quant", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.moe_wna16.MoeWNA16Method", "methods": [ { "kind": "function", "name": "MoeWNA16Method.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MoeWNA16Method.create_weights", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "MoeWNA16Method.get_fused_moe_quant_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MoeWNA16Method.apply", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MoeWNA16Method.get_weight_loader", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MoeWNA16Method.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 16, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 16, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.moe_wna16", "names": [ "vllm.model_executor.layers.quantization.moe_wna16.MoeWNA16Config", "vllm.model_executor.layers.quantization.moe_wna16.MoeWNA16Method", "vllm.model_executor.layers.quantization.moe_wna16.is_layer_skipped_quant" ], "n_typable": 56, "n_typed": 37, "n_any": 0, "n_untyped": 19, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 29, "n_classes": 2, "n_attrs": 10, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/mxfp4.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.quantization.mxfp4.get_mxfp4_backend_with_lora", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.mxfp4.get_mxfp4_backend", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.mxfp4.XpuMxfp4MoEMethod", "methods": [ { "kind": "function", "name": "XpuMxfp4MoEMethod.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "XpuMxfp4MoEMethod.create_weights", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "XpuMxfp4MoEMethod.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "XpuMxfp4MoEMethod.apply_monolithic", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [ { "kind": "property", "name": "XpuMxfp4MoEMethod.is_monolithic", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "XpuMxfp4MoEMethod.moe_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 13, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 11, "n_attrs": 1, "n_properties": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.mxfp4.Mxfp4Backend", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Mxfp4Backend.NONE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Mxfp4Backend.SM100_FI_MXFP4_MXFP8_TRTLLM", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Mxfp4Backend.SM100_FI_MXFP4_MXFP8_CUTLASS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Mxfp4Backend.SM100_FI_MXFP4_BF16", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Mxfp4Backend.SM90_FI_MXFP4_BF16", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Mxfp4Backend.MARLIN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Mxfp4Backend.TRITON", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Mxfp4Backend.CK", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.mxfp4.Mxfp4Config", "methods": [ { "kind": "function", "name": "Mxfp4Config.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Mxfp4Config.from_config", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Mxfp4Config.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Mxfp4Config.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Mxfp4Config.get_supported_act_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Mxfp4Config.get_config_filenames", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Mxfp4Config.get_quant_method", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Mxfp4Config.is_mxfp4_quant", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Mxfp4Config.ignored_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 11, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 6, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.mxfp4.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.mxfp4.Mxfp4MoEMethod", "methods": [ { "kind": "function", "name": "Mxfp4MoEMethod.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Mxfp4MoEMethod.create_weights", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Mxfp4MoEMethod.process_weights_after_loading", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Mxfp4MoEMethod.get_fused_moe_quant_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Mxfp4MoEMethod.select_gemm_impl", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Mxfp4MoEMethod.apply", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Mxfp4MoEMethod.apply_monolithic", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [ { "kind": "property", "name": "Mxfp4MoEMethod.is_monolithic", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "Mxfp4MoEMethod.weight_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Mxfp4MoEMethod.mxfp4_backend", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Mxfp4MoEMethod.max_capture_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Mxfp4MoEMethod.moe_kernel", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 31, "n_typed": 23, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 19, "n_attrs": 4, "n_properties": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.mxfp4", "names": [ "vllm.model_executor.layers.quantization.mxfp4.Mxfp4Backend", "vllm.model_executor.layers.quantization.mxfp4.Mxfp4Config", "vllm.model_executor.layers.quantization.mxfp4.Mxfp4MoEMethod", "vllm.model_executor.layers.quantization.mxfp4.XpuMxfp4MoEMethod", "vllm.model_executor.layers.quantization.mxfp4.get_mxfp4_backend", "vllm.model_executor.layers.quantization.mxfp4.get_mxfp4_backend_with_lora", "vllm.model_executor.layers.quantization.mxfp4.logger" ], "n_typable": 67, "n_typed": 50, "n_any": 0, "n_untyped": 17, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 1, "n_methods": 19, "n_method_overloads": 19, "n_method_params": 36, "n_classes": 4, "n_attrs": 15, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/petit.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.quantization.petit.PetitNvFp4LinearMethod", "methods": [ { "kind": "function", "name": "PetitNvFp4LinearMethod.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PetitNvFp4LinearMethod.create_weights", "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "PetitNvFp4LinearMethod.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PetitNvFp4LinearMethod.apply", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PetitNvFp4LinearMethod.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 13, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 12, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.petit.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.petit.PetitFp8KVCacheMethod", "methods": [ { "kind": "function", "name": "PetitFp8KVCacheMethod.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.petit.PetitNvFp4Config", "methods": [ { "kind": "function", "name": "PetitNvFp4Config.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "PetitNvFp4Config._check_hardware_support", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PetitNvFp4Config.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PetitNvFp4Config.get_supported_act_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PetitNvFp4Config.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PetitNvFp4Config.get_config_filenames", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PetitNvFp4Config.from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PetitNvFp4Config.override_quantization_method", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PetitNvFp4Config.is_petit_nvfp4_compatible", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PetitNvFp4Config.is_layer_excluded", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PetitNvFp4Config.get_quant_method", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PetitNvFp4Config.get_scaled_act_names", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PetitNvFp4Config.require_group_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PetitNvFp4Config.require_kv_cache_quant_algo", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PetitNvFp4Config.require_exclude_modules", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PetitNvFp4Config.is_checkpoint_nvfp4_serialized", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PetitNvFp4Config.group_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PetitNvFp4Config.kv_cache_quant_algo", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PetitNvFp4Config.exclude_modules", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 31, "n_typed": 25, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 12, "n_attrs": 4, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.petit", "names": [ "vllm.model_executor.layers.quantization.petit.PetitFp8KVCacheMethod", "vllm.model_executor.layers.quantization.petit.PetitNvFp4Config", "vllm.model_executor.layers.quantization.petit.PetitNvFp4LinearMethod", "vllm.model_executor.layers.quantization.petit.logger" ], "n_typable": 51, "n_typed": 39, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 20, "n_method_overloads": 20, "n_method_params": 25, "n_classes": 3, "n_attrs": 6, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/ptpc_fp8.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.quantization.ptpc_fp8.PTPCFp8Config", "methods": [ { "kind": "function", "name": "PTPCFp8Config.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PTPCFp8Config.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PTPCFp8Config.from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PTPCFp8Config.get_quant_method", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.ptpc_fp8.PTPCFp8LinearMethod", "methods": [ { "kind": "function", "name": "PTPCFp8LinearMethod.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PTPCFp8LinearMethod.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PTPCFp8LinearMethod.apply", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PTPCFp8LinearMethod.fp8_linear", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 7, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 5, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.ptpc_fp8", "names": [ "vllm.model_executor.layers.quantization.ptpc_fp8.PTPCFp8Config", "vllm.model_executor.layers.quantization.ptpc_fp8.PTPCFp8LinearMethod" ], "n_typable": 18, "n_typed": 16, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 10, "n_classes": 2, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/quark/quark.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.quantization.quark.quark.QuarkLinearMethod", "methods": [ { "kind": "function", "name": "QuarkLinearMethod.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "QuarkLinearMethod.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "QuarkLinearMethod.create_weights", "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "QuarkLinearMethod.apply", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "QuarkLinearMethod.quantization_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 12, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 12, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.quark.quark", "names": [ "vllm.model_executor.layers.quantization.quark.quark.QuarkLinearMethod" ], "n_typable": 17, "n_typed": 12, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 12, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/quark/quark_moe.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.quantization.quark.quark_moe.QuarkMoEMethod", "methods": [ { "kind": "function", "name": "QuarkMoEMethod.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "QuarkMoEMethod.get_moe_method", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "QuarkMoEMethod.has_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.quark.quark_moe.QuarkOCP_MX_MoEMethod_OSS", "methods": [ { "kind": "function", "name": "QuarkOCP_MX_MoEMethod_OSS.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "QuarkOCP_MX_MoEMethod_OSS.process_weights_after_loading", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "QuarkOCP_MX_MoEMethod_OSS.get_fused_moe_quant_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "QuarkOCP_MX_MoEMethod_OSS.apply_monolithic", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [ { "kind": "property", "name": "QuarkOCP_MX_MoEMethod_OSS.is_monolithic", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [], "n_typable": 14, "n_typed": 11, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 9, "n_attrs": 0, "n_properties": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.quark.quark_moe.QuarkOCP_MX_MoEMethod", "methods": [ { "kind": "function", "name": "QuarkOCP_MX_MoEMethod.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "QuarkOCP_MX_MoEMethod.get_packed_dim", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "QuarkOCP_MX_MoEMethod.create_weights", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "QuarkOCP_MX_MoEMethod.process_weights_after_loading", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "QuarkOCP_MX_MoEMethod.get_fused_moe_quant_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "QuarkOCP_MX_MoEMethod.apply", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "QuarkOCP_MX_MoEMethod.weight_quant", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuarkOCP_MX_MoEMethod.input_quant", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuarkOCP_MX_MoEMethod.weight_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuarkOCP_MX_MoEMethod.fp4_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuarkOCP_MX_MoEMethod.ocp_mx_scheme", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuarkOCP_MX_MoEMethod.mxfp4_backend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "QuarkOCP_MX_MoEMethod.use_rocm_aiter_moe", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuarkOCP_MX_MoEMethod.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuarkOCP_MX_MoEMethod.emulate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuarkOCP_MX_MoEMethod.static_input_scales", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuarkOCP_MX_MoEMethod.input_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 35, "n_typed": 19, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 18, "n_attrs": 11, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.quark.quark_moe", "names": [ "vllm.model_executor.layers.quantization.quark.quark_moe.QuarkMoEMethod", "vllm.model_executor.layers.quantization.quark.quark_moe.QuarkOCP_MX_MoEMethod", "vllm.model_executor.layers.quantization.quark.quark_moe.QuarkOCP_MX_MoEMethod_OSS" ], "n_typable": 56, "n_typed": 35, "n_any": 0, "n_untyped": 21, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 31, "n_classes": 3, "n_attrs": 12, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/quark/schemes/quark_ocp_mx.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.quantization.quark.schemes.quark_ocp_mx.QuarkOCP_MX", "methods": [ { "kind": "function", "name": "QuarkOCP_MX.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "QuarkOCP_MX.get_packed_dim", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "QuarkOCP_MX.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "QuarkOCP_MX.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "QuarkOCP_MX.create_weights", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "QuarkOCP_MX.apply_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "QuarkOCP_MX.out_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuarkOCP_MX.qscheme", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuarkOCP_MX.weight_quant_spec", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuarkOCP_MX.input_quant_spec", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuarkOCP_MX.dynamic_mxfp4_quant", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuarkOCP_MX.weight_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuarkOCP_MX.input_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuarkOCP_MX.ocp_mx_scheme", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuarkOCP_MX.static_input_scales", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuarkOCP_MX.emulate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuarkOCP_MX.rocm_use_aiter_fp4_asm_gemm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuarkOCP_MX.packed_factor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "QuarkOCP_MX.dequant_func", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuarkOCP_MX.quant_dequant_func", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 35, "n_typed": 18, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 15, "n_attrs": 14, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.quark.schemes.quark_ocp_mx.gemm_with_dynamic_quant_fake", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.quark.schemes.quark_ocp_mx.gemm_with_dynamic_quant", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.quark.schemes.quark_ocp_mx.is_rocm_aiter_fp4_asm_gemm_enabled", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.quark.schemes.quark_ocp_mx.dynamic_mxfp4_quant", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.quark.schemes.quark_ocp_mx.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.quark.schemes.quark_ocp_mx.gemm_afp4wfp4", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.quark.schemes.quark_ocp_mx", "names": [ "vllm.model_executor.layers.quantization.quark.schemes.quark_ocp_mx.QuarkOCP_MX", "vllm.model_executor.layers.quantization.quark.schemes.quark_ocp_mx.dynamic_mxfp4_quant", "vllm.model_executor.layers.quantization.quark.schemes.quark_ocp_mx.gemm_afp4wfp4", "vllm.model_executor.layers.quantization.quark.schemes.quark_ocp_mx.gemm_with_dynamic_quant", "vllm.model_executor.layers.quantization.quark.schemes.quark_ocp_mx.gemm_with_dynamic_quant_fake", "vllm.model_executor.layers.quantization.quark.schemes.quark_ocp_mx.is_rocm_aiter_fp4_asm_gemm_enabled", "vllm.model_executor.layers.quantization.quark.schemes.quark_ocp_mx.logger" ], "n_typable": 51, "n_typed": 33, "n_any": 0, "n_untyped": 18, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 12, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 15, "n_classes": 1, "n_attrs": 17, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/quark/schemes/quark_scheme.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.quantization.quark.schemes.quark_scheme.QuarkScheme", "methods": [ { "kind": "function", "name": "QuarkScheme.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "QuarkScheme.create_weights", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "QuarkScheme.apply_weights", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "QuarkScheme.process_weights_after_loading", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 10, "n_typed": 5, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 6, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.quark.schemes.quark_scheme", "names": [ "vllm.model_executor.layers.quantization.quark.schemes.quark_scheme.QuarkScheme" ], "n_typable": 10, "n_typed": 5, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 6, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/quark/schemes/quark_w8a8_fp8.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.quantization.quark.schemes.quark_w8a8_fp8.QuarkW8A8Fp8", "methods": [ { "kind": "function", "name": "QuarkW8A8Fp8.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "QuarkW8A8Fp8.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "QuarkW8A8Fp8.process_weights_after_loading", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "QuarkW8A8Fp8.create_weights", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "QuarkW8A8Fp8.apply_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "QuarkW8A8Fp8.weight_qscheme", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuarkW8A8Fp8.is_static_input_scheme", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "QuarkW8A8Fp8.input_qscheme", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "QuarkW8A8Fp8.activation_quant_key", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuarkW8A8Fp8.weight_quant_key", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuarkW8A8Fp8.out_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 23, "n_typed": 15, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 12, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.quark.schemes.quark_w8a8_fp8", "names": [ "vllm.model_executor.layers.quantization.quark.schemes.quark_w8a8_fp8.QuarkW8A8Fp8" ], "n_typable": 23, "n_typed": 15, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 12, "n_classes": 1, "n_attrs": 6, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/quark/schemes/quark_w8a8_int8.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.quantization.quark.schemes.quark_w8a8_int8.QuarkW8A8Int8", "methods": [ { "kind": "function", "name": "QuarkW8A8Int8.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "QuarkW8A8Int8.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "QuarkW8A8Int8.create_weights", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "QuarkW8A8Int8.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "QuarkW8A8Int8.apply_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "QuarkW8A8Int8.qscheme", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuarkW8A8Int8.is_static_input_scheme", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuarkW8A8Int8.input_symmetric", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 15, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 13, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.quark.schemes.quark_w8a8_int8.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.quark.schemes.quark_w8a8_int8", "names": [ "vllm.model_executor.layers.quantization.quark.schemes.quark_w8a8_int8.QuarkW8A8Int8", "vllm.model_executor.layers.quantization.quark.schemes.quark_w8a8_int8.logger" ], "n_typable": 22, "n_typed": 15, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 13, "n_classes": 1, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/quark/utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.quantization.quark.utils.should_ignore_layer", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.quark.utils.deep_compare", "n_typed": 1, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.quark.utils.check_equal_or_regex_match", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.quark.utils.quark_quantize_weight_to_mxfp4", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.quark.utils", "names": [ "vllm.model_executor.layers.quantization.quark.utils.check_equal_or_regex_match", "vllm.model_executor.layers.quantization.quark.utils.deep_compare", "vllm.model_executor.layers.quantization.quark.utils.quark_quantize_weight_to_mxfp4", "vllm.model_executor.layers.quantization.quark.utils.should_ignore_layer" ], "n_typable": 12, "n_typed": 9, "n_any": 2, "n_untyped": 1, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 8, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/qutlass_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.quantization.qutlass_utils.to_blocked", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.qutlass_utils.triton_scale_swizzle", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.qutlass_utils.triton_mx_block_rearrange", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.qutlass_utils", "names": [ "vllm.model_executor.layers.quantization.qutlass_utils.to_blocked", "vllm.model_executor.layers.quantization.qutlass_utils.triton_mx_block_rearrange", "vllm.model_executor.layers.quantization.qutlass_utils.triton_scale_swizzle" ], "n_typable": 14, "n_typed": 13, "n_any": 0, "n_untyped": 1, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 11, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/schema.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.quantization.schema.QuantParamSchema", "methods": [ { "kind": "function", "name": "QuantParamSchema.check_model_type", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "QuantParamSchema.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QuantParamSchema.model_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "QuantParamSchema.kv_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 5, "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.schema.KVCacheQuantSchema", "methods": [ { "kind": "function", "name": "KVCacheQuantSchema.check_is_fp8", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KVCacheQuantSchema.check_tp_ranks", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVCacheQuantSchema.check_current_rank", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "KVCacheQuantSchema.dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KVCacheQuantSchema.scaling_factor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 2, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.schema", "names": [ "vllm.model_executor.layers.quantization.schema.KVCacheQuantSchema", "vllm.model_executor.layers.quantization.schema.QuantParamSchema" ], "n_typable": 12, "n_typed": 11, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 3, "n_classes": 2, "n_attrs": 5, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/torchao.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.layers.quantization.torchao.convert_to_packed_tensor_based_on_current_hardware", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.torchao.TorchAOLinearMethod", "methods": [ { "kind": "function", "name": "TorchAOLinearMethod.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TorchAOLinearMethod.create_weights", "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "TorchAOLinearMethod.apply", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "TorchAOLinearMethod.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TorchAOLinearMethod.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 13, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 12, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.torchao.TorchAOConfig", "methods": [ { "kind": "function", "name": "TorchAOConfig.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "TorchAOConfig.__repr__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TorchAOConfig.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TorchAOConfig.get_supported_act_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TorchAOConfig.get_min_capability", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TorchAOConfig.get_config_filenames", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TorchAOConfig.from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TorchAOConfig.from_config_file", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TorchAOConfig.from_config_dict_json", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TorchAOConfig.get_quant_method", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TorchAOConfig.get_scaled_act_names", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TorchAOConfig.torchao_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TorchAOConfig.skip_modules", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TorchAOConfig.is_checkpoint_torchao_serialized", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 18, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 8, "n_attrs": 3, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.torchao.should_skip", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.torchao.torchao_quantize_param_data", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.torchao.torchao_version_at_least", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.torchao.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.torchao", "names": [ "vllm.model_executor.layers.quantization.torchao.TorchAOConfig", "vllm.model_executor.layers.quantization.torchao.TorchAOLinearMethod", "vllm.model_executor.layers.quantization.torchao.convert_to_packed_tensor_based_on_current_hardware", "vllm.model_executor.layers.quantization.torchao.logger", "vllm.model_executor.layers.quantization.torchao.should_skip", "vllm.model_executor.layers.quantization.torchao.torchao_quantize_param_data", "vllm.model_executor.layers.quantization.torchao.torchao_version_at_least" ], "n_typable": 48, "n_typed": 38, "n_any": 1, "n_untyped": 9, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 5, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 20, "n_classes": 2, "n_attrs": 6, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/utils/layer_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.layer_utils.replace_parameter", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.layer_utils.update_tensor_inplace", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.utils.layer_utils", "names": [ "vllm.model_executor.layers.quantization.utils.layer_utils.replace_parameter", "vllm.model_executor.layers.quantization.utils.layer_utils.update_tensor_inplace" ], "n_typable": 7, "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 5, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/utils/allspark_utils.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.allspark_utils.ALLSPARK_AMPERE_K_ALIGN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.allspark_utils.ALLSPARK_SUPPORTED_QUANT_TYPES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.allspark_utils.ALLSPARK_AMPERE_N_ALIGN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.allspark_utils.check_allspark_supported_dtype_shape", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.allspark_utils.ALLSPARK_AMPERE_M_CUBLAS_THRESHOLD", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.utils.allspark_utils", "names": [ "vllm.model_executor.layers.quantization.utils.allspark_utils.ALLSPARK_AMPERE_K_ALIGN", "vllm.model_executor.layers.quantization.utils.allspark_utils.ALLSPARK_AMPERE_M_CUBLAS_THRESHOLD", "vllm.model_executor.layers.quantization.utils.allspark_utils.ALLSPARK_AMPERE_N_ALIGN", "vllm.model_executor.layers.quantization.utils.allspark_utils.ALLSPARK_SUPPORTED_QUANT_TYPES", "vllm.model_executor.layers.quantization.utils.allspark_utils.check_allspark_supported_dtype_shape" ], "n_typable": 6, "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 5, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/utils/flashinfer_fp4_moe.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.flashinfer_fp4_moe.reorder_w1w3_to_w3w1", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.utils.flashinfer_fp4_moe", "names": [ "vllm.model_executor.layers.quantization.utils.flashinfer_fp4_moe.reorder_w1w3_to_w3w1" ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 3, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/utils/flashinfer_mxint4_moe.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.flashinfer_mxint4_moe.flashinfer_trtllm_mxint4_moe", "n_typed": 16, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.flashinfer_mxint4_moe.is_flashinfer_mxint4_moe_available", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.flashinfer_mxint4_moe.prepare_static_weights_for_trtllm_mxint4_moe", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.utils.flashinfer_mxint4_moe", "names": [ "vllm.model_executor.layers.quantization.utils.flashinfer_mxint4_moe.flashinfer_trtllm_mxint4_moe", "vllm.model_executor.layers.quantization.utils.flashinfer_mxint4_moe.is_flashinfer_mxint4_moe_available", "vllm.model_executor.layers.quantization.utils.flashinfer_mxint4_moe.prepare_static_weights_for_trtllm_mxint4_moe" ], "n_typable": 22, "n_typed": 22, "n_any": 0, "n_untyped": 0, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 19, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/utils/flashinfer_utils.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.quantization.utils.flashinfer_utils.FlashinferMoeBackend", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashinferMoeBackend.TENSORRT_LLM", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashinferMoeBackend.CUTLASS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashinferMoeBackend.CUTEDSL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.flashinfer_utils.convert_moe_weights_to_flashinfer_trtllm_block_layout", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.flashinfer_utils.prepare_fp8_moe_layer_for_fi", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.flashinfer_utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.flashinfer_utils.swap_w13_to_w31", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.flashinfer_utils.align_fp4_moe_weights_for_fi", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.flashinfer_utils.align_fp8_moe_weights_for_fi", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.flashinfer_utils.activation_to_flashinfer_type", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.flashinfer_utils.activation_to_flashinfer_int", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.flashinfer_utils.rotate_weights_for_fi_trtllm_fp8_per_tensor_moe", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.flashinfer_utils.is_flashinfer_supporting_global_sf", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.flashinfer_utils.get_flashinfer_moe_backend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.utils.flashinfer_utils", "names": [ "vllm.model_executor.layers.quantization.utils.flashinfer_utils.FlashinferMoeBackend", "vllm.model_executor.layers.quantization.utils.flashinfer_utils.activation_to_flashinfer_int", "vllm.model_executor.layers.quantization.utils.flashinfer_utils.activation_to_flashinfer_type", "vllm.model_executor.layers.quantization.utils.flashinfer_utils.align_fp4_moe_weights_for_fi", "vllm.model_executor.layers.quantization.utils.flashinfer_utils.align_fp8_moe_weights_for_fi", "vllm.model_executor.layers.quantization.utils.flashinfer_utils.convert_moe_weights_to_flashinfer_trtllm_block_layout", "vllm.model_executor.layers.quantization.utils.flashinfer_utils.get_flashinfer_moe_backend", "vllm.model_executor.layers.quantization.utils.flashinfer_utils.is_flashinfer_supporting_global_sf", "vllm.model_executor.layers.quantization.utils.flashinfer_utils.logger", "vllm.model_executor.layers.quantization.utils.flashinfer_utils.prepare_fp8_moe_layer_for_fi", "vllm.model_executor.layers.quantization.utils.flashinfer_utils.rotate_weights_for_fi_trtllm_fp8_per_tensor_moe", "vllm.model_executor.layers.quantization.utils.flashinfer_utils.swap_w13_to_w31" ], "n_typable": 39, "n_typed": 37, "n_any": 0, "n_untyped": 2, "n_functions": 10, "n_function_overloads": 10, "n_function_params": 28, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 1, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/utils/fp8_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.fp8_utils.prepare_fp8_moe_layer_for_deepgemm", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.fp8_utils.is_fp8", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.fp8_utils.maybe_post_process_fp8_weight_block", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.fp8_utils.requant_weight_ue8m0_inplace", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.fp8_utils.create_fp8_scale_parameter", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.fp8_utils.create_fp8_weight_parameter", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.fp8_utils.deepgemm_post_process_fp8_weight_block", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.fp8_utils.process_fp8_weight_tensor_strategy", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.fp8_utils.process_fp8_input_tensor_strategy_moe", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.fp8_utils.create_fp8_input_scale", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.fp8_utils.process_fp8_weight_tensor_strategy_moe", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.fp8_utils.validate_fp8_block_shape", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.fp8_utils.input_to_float8", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.fp8_utils.get_w8a8_block_fp8_configs", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.fp8_utils.cutlass_scaled_mm", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.fp8_utils.per_token_group_quant_fp8_packed_for_deepgemm", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.fp8_utils.process_fp8_weight_block_strategy", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.utils.fp8_utils.W8A8BlockFp8LinearOp", "methods": [ { "kind": "function", "name": "W8A8BlockFp8LinearOp.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "W8A8BlockFp8LinearOp.apply", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "W8A8BlockFp8LinearOp._run_deepgemm", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "W8A8BlockFp8LinearOp._run_cutlass", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "W8A8BlockFp8LinearOp._run_aiter", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "W8A8BlockFp8LinearOp._run_triton", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "W8A8BlockFp8LinearOp._run_flashinfer", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "W8A8BlockFp8LinearOp._dispatch_w8a8_blockscale_op", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "W8A8BlockFp8LinearOp.weight_group_shape", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "W8A8BlockFp8LinearOp.act_quant_group_shape", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "W8A8BlockFp8LinearOp.is_deep_gemm_supported", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "W8A8BlockFp8LinearOp.is_hopper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "W8A8BlockFp8LinearOp.use_deep_gemm_e8m0", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "W8A8BlockFp8LinearOp.is_flashinfer_supported", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "W8A8BlockFp8LinearOp.deepgemm_input_quant_op", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 44, "n_typed": 36, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 29, "n_attrs": 7, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.fp8_utils.silu_mul_per_token_group_quant_fp8_colmajor", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.fp8_utils.per_token_group_quant_fp8", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.fp8_utils.w8a8_triton_block_scaled_mm", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.fp8_utils.process_fp8_weight_channel_strategy", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.fp8_utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.utils.fp8_utils", "names": [ "vllm.model_executor.layers.quantization.utils.fp8_utils.W8A8BlockFp8LinearOp", "vllm.model_executor.layers.quantization.utils.fp8_utils.create_fp8_input_scale", "vllm.model_executor.layers.quantization.utils.fp8_utils.create_fp8_scale_parameter", "vllm.model_executor.layers.quantization.utils.fp8_utils.create_fp8_weight_parameter", "vllm.model_executor.layers.quantization.utils.fp8_utils.cutlass_scaled_mm", "vllm.model_executor.layers.quantization.utils.fp8_utils.deepgemm_post_process_fp8_weight_block", "vllm.model_executor.layers.quantization.utils.fp8_utils.get_w8a8_block_fp8_configs", "vllm.model_executor.layers.quantization.utils.fp8_utils.input_to_float8", "vllm.model_executor.layers.quantization.utils.fp8_utils.is_fp8", "vllm.model_executor.layers.quantization.utils.fp8_utils.logger", "vllm.model_executor.layers.quantization.utils.fp8_utils.maybe_post_process_fp8_weight_block", "vllm.model_executor.layers.quantization.utils.fp8_utils.per_token_group_quant_fp8", "vllm.model_executor.layers.quantization.utils.fp8_utils.per_token_group_quant_fp8_packed_for_deepgemm", "vllm.model_executor.layers.quantization.utils.fp8_utils.prepare_fp8_moe_layer_for_deepgemm", "vllm.model_executor.layers.quantization.utils.fp8_utils.process_fp8_input_tensor_strategy_moe", "vllm.model_executor.layers.quantization.utils.fp8_utils.process_fp8_weight_block_strategy", "vllm.model_executor.layers.quantization.utils.fp8_utils.process_fp8_weight_channel_strategy", "vllm.model_executor.layers.quantization.utils.fp8_utils.process_fp8_weight_tensor_strategy", "vllm.model_executor.layers.quantization.utils.fp8_utils.process_fp8_weight_tensor_strategy_moe", "vllm.model_executor.layers.quantization.utils.fp8_utils.requant_weight_ue8m0_inplace", "vllm.model_executor.layers.quantization.utils.fp8_utils.silu_mul_per_token_group_quant_fp8_colmajor", "vllm.model_executor.layers.quantization.utils.fp8_utils.validate_fp8_block_shape", "vllm.model_executor.layers.quantization.utils.fp8_utils.w8a8_triton_block_scaled_mm" ], "n_typable": 147, "n_typed": 135, "n_any": 0, "n_untyped": 12, "n_functions": 21, "n_function_overloads": 21, "n_function_params": 81, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 29, "n_classes": 1, "n_attrs": 8, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/utils/gptq_utils.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.gptq_utils.GPTQMarlinConfig", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.gptq_utils.GPTQConfig", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.gptq_utils.get_dynamic_override", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.gptq_utils.override_config", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.gptq_utils.get_linear_quant_method", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.gptq_utils.is_layer_gptq_quantized", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.utils.gptq_utils", "names": [ "vllm.model_executor.layers.quantization.utils.gptq_utils.GPTQConfig", "vllm.model_executor.layers.quantization.utils.gptq_utils.GPTQMarlinConfig", "vllm.model_executor.layers.quantization.utils.gptq_utils.get_dynamic_override", "vllm.model_executor.layers.quantization.utils.gptq_utils.get_linear_quant_method", "vllm.model_executor.layers.quantization.utils.gptq_utils.is_layer_gptq_quantized", "vllm.model_executor.layers.quantization.utils.gptq_utils.override_config" ], "n_typable": 17, "n_typed": 15, "n_any": 0, "n_untyped": 2, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 13, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/utils/int8_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.int8_utils.round_int8", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.int8_utils.input_to_int8", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.int8_utils.get_w8a8_block_int8_configs", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.int8_utils.block_dequant", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.int8_utils.w8a8_block_int8_matmul", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.int8_utils.per_token_group_quant_int8", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.int8_utils.per_token_quant_int8", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.int8_utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.int8_utils.apply_w8a8_block_int8_linear", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.utils.int8_utils", "names": [ "vllm.model_executor.layers.quantization.utils.int8_utils.apply_w8a8_block_int8_linear", "vllm.model_executor.layers.quantization.utils.int8_utils.block_dequant", "vllm.model_executor.layers.quantization.utils.int8_utils.get_w8a8_block_int8_configs", "vllm.model_executor.layers.quantization.utils.int8_utils.input_to_int8", "vllm.model_executor.layers.quantization.utils.int8_utils.logger", "vllm.model_executor.layers.quantization.utils.int8_utils.per_token_group_quant_int8", "vllm.model_executor.layers.quantization.utils.int8_utils.per_token_quant_int8", "vllm.model_executor.layers.quantization.utils.int8_utils.round_int8", "vllm.model_executor.layers.quantization.utils.int8_utils.w8a8_block_int8_matmul" ], "n_typable": 36, "n_typed": 31, "n_any": 0, "n_untyped": 5, "n_functions": 8, "n_function_overloads": 8, "n_function_params": 27, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/utils/machete_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.machete_utils.query_machete_supported_group_sizes", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.machete_utils.MACHETE_PREPACKED_BLOCK_SHAPE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.machete_utils.query_machete_supported_act_types", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.machete_utils.query_machete_supported_quant_types", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.machete_utils.check_machete_supports_shape", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.utils.machete_utils", "names": [ "vllm.model_executor.layers.quantization.utils.machete_utils.MACHETE_PREPACKED_BLOCK_SHAPE", "vllm.model_executor.layers.quantization.utils.machete_utils.check_machete_supports_shape", "vllm.model_executor.layers.quantization.utils.machete_utils.query_machete_supported_act_types", "vllm.model_executor.layers.quantization.utils.machete_utils.query_machete_supported_group_sizes", "vllm.model_executor.layers.quantization.utils.machete_utils.query_machete_supported_quant_types" ], "n_typable": 9, "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 5, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/utils/marlin_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils.marlin_zero_points", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils.marlin_moe_intermediate_size", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils.marlin_make_empty_g_idx", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils.GPTQ_MARLIN_TILE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils.marlin_moe_permute_scales", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils.check_marlin_supported", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils.marlin_make_workspace_new", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils.check_marlin_supports_layer", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils.MARLIN_SUPPORTED_GROUP_SIZES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils.check_marlin_supports_shape", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils.marlin_permute_scales", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils.get_scale_perms", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils.GPTQ_MARLIN_MIN_THREAD_N", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils.should_use_atomic_add_reduce", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils.GPTQ_MARLIN_MAX_PARALLEL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils.apply_gptq_marlin_linear", "n_typed": 16, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils.verify_marlin_supports_shape", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils.maybe_warn_marlin_atomic_add", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils.awq_to_marlin_zero_points", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils.get_marlin_input_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils.marlin_quant_input", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils.apply_awq_marlin_linear", "n_typed": 15, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 15, "n_params": 14, "n_function_overloads": 1, "n_function_params": 14 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils.query_marlin_supported_quant_types", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils.GPTQ_MARLIN_MIN_THREAD_K", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils.USE_FP32_REDUCE_DEFAULT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils.marlin_act_int8_process_scales", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils.marlin_sort_g_idx", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils.marlin_permute_bias", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils.maybe_warn_marlin_atomic_add_env", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils.marlin_is_k_full", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils.moe_awq_to_marlin_zero_points", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils.get__quant_fp8_method", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils.verify_marlin_supported", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils.marlin_repeat_scales_on_all_ranks", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils.check_moe_marlin_supports_layer", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.utils.marlin_utils", "names": [ "vllm.model_executor.layers.quantization.utils.marlin_utils.GPTQ_MARLIN_MAX_PARALLEL", "vllm.model_executor.layers.quantization.utils.marlin_utils.GPTQ_MARLIN_MIN_THREAD_K", "vllm.model_executor.layers.quantization.utils.marlin_utils.GPTQ_MARLIN_MIN_THREAD_N", "vllm.model_executor.layers.quantization.utils.marlin_utils.GPTQ_MARLIN_TILE", "vllm.model_executor.layers.quantization.utils.marlin_utils.MARLIN_SUPPORTED_GROUP_SIZES", "vllm.model_executor.layers.quantization.utils.marlin_utils.USE_FP32_REDUCE_DEFAULT", "vllm.model_executor.layers.quantization.utils.marlin_utils.apply_awq_marlin_linear", "vllm.model_executor.layers.quantization.utils.marlin_utils.apply_gptq_marlin_linear", "vllm.model_executor.layers.quantization.utils.marlin_utils.awq_to_marlin_zero_points", "vllm.model_executor.layers.quantization.utils.marlin_utils.check_marlin_supported", "vllm.model_executor.layers.quantization.utils.marlin_utils.check_marlin_supports_layer", "vllm.model_executor.layers.quantization.utils.marlin_utils.check_marlin_supports_shape", "vllm.model_executor.layers.quantization.utils.marlin_utils.check_moe_marlin_supports_layer", "vllm.model_executor.layers.quantization.utils.marlin_utils.get__quant_fp8_method", "vllm.model_executor.layers.quantization.utils.marlin_utils.get_marlin_input_dtype", "vllm.model_executor.layers.quantization.utils.marlin_utils.get_scale_perms", "vllm.model_executor.layers.quantization.utils.marlin_utils.logger", "vllm.model_executor.layers.quantization.utils.marlin_utils.marlin_act_int8_process_scales", "vllm.model_executor.layers.quantization.utils.marlin_utils.marlin_is_k_full", "vllm.model_executor.layers.quantization.utils.marlin_utils.marlin_make_empty_g_idx", "vllm.model_executor.layers.quantization.utils.marlin_utils.marlin_make_workspace_new", "vllm.model_executor.layers.quantization.utils.marlin_utils.marlin_moe_intermediate_size", "vllm.model_executor.layers.quantization.utils.marlin_utils.marlin_moe_permute_scales", "vllm.model_executor.layers.quantization.utils.marlin_utils.marlin_permute_bias", "vllm.model_executor.layers.quantization.utils.marlin_utils.marlin_permute_scales", "vllm.model_executor.layers.quantization.utils.marlin_utils.marlin_quant_input", "vllm.model_executor.layers.quantization.utils.marlin_utils.marlin_repeat_scales_on_all_ranks", "vllm.model_executor.layers.quantization.utils.marlin_utils.marlin_sort_g_idx", "vllm.model_executor.layers.quantization.utils.marlin_utils.marlin_zero_points", "vllm.model_executor.layers.quantization.utils.marlin_utils.maybe_warn_marlin_atomic_add", "vllm.model_executor.layers.quantization.utils.marlin_utils.maybe_warn_marlin_atomic_add_env", "vllm.model_executor.layers.quantization.utils.marlin_utils.moe_awq_to_marlin_zero_points", "vllm.model_executor.layers.quantization.utils.marlin_utils.query_marlin_supported_quant_types", "vllm.model_executor.layers.quantization.utils.marlin_utils.should_use_atomic_add_reduce", "vllm.model_executor.layers.quantization.utils.marlin_utils.verify_marlin_supported", "vllm.model_executor.layers.quantization.utils.marlin_utils.verify_marlin_supports_shape" ], "n_typable": 129, "n_typed": 116, "n_any": 0, "n_untyped": 13, "n_functions": 29, "n_function_overloads": 29, "n_function_params": 99, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 7, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/utils/marlin_utils_fp4.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils_fp4.prepare_moe_fp4_layer_for_marlin", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils_fp4.is_fp4_marlin_supported", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils_fp4.prepare_nvfp4_moe_layer_for_marlin", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils_fp4.rand_marlin_weight_mxfp4_like", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils_fp4.mxfp4_marlin_process_scales", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils_fp4.nvfp4_marlin_process_scales", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils_fp4.prepare_fp4_layer_for_marlin", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils_fp4.nvfp4_marlin_process_global_scale", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils_fp4.rand_marlin_weight_nvfp4_like", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils_fp4.apply_fp4_marlin_linear", "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils_fp4.FP4_MARLIN_SUPPORTED_GROUP_SIZES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils_fp4.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.utils.marlin_utils_fp4", "names": [ "vllm.model_executor.layers.quantization.utils.marlin_utils_fp4.FP4_MARLIN_SUPPORTED_GROUP_SIZES", "vllm.model_executor.layers.quantization.utils.marlin_utils_fp4.apply_fp4_marlin_linear", "vllm.model_executor.layers.quantization.utils.marlin_utils_fp4.is_fp4_marlin_supported", "vllm.model_executor.layers.quantization.utils.marlin_utils_fp4.logger", "vllm.model_executor.layers.quantization.utils.marlin_utils_fp4.mxfp4_marlin_process_scales", "vllm.model_executor.layers.quantization.utils.marlin_utils_fp4.nvfp4_marlin_process_global_scale", "vllm.model_executor.layers.quantization.utils.marlin_utils_fp4.nvfp4_marlin_process_scales", "vllm.model_executor.layers.quantization.utils.marlin_utils_fp4.prepare_fp4_layer_for_marlin", "vllm.model_executor.layers.quantization.utils.marlin_utils_fp4.prepare_moe_fp4_layer_for_marlin", "vllm.model_executor.layers.quantization.utils.marlin_utils_fp4.prepare_nvfp4_moe_layer_for_marlin", "vllm.model_executor.layers.quantization.utils.marlin_utils_fp4.rand_marlin_weight_mxfp4_like", "vllm.model_executor.layers.quantization.utils.marlin_utils_fp4.rand_marlin_weight_nvfp4_like" ], "n_typable": 43, "n_typed": 26, "n_any": 0, "n_untyped": 17, "n_functions": 10, "n_function_overloads": 10, "n_function_params": 32, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/utils/marlin_utils_fp8.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils_fp8.fp8_fused_exponent_bias_into_scales", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils_fp8.prepare_fp8_layer_for_marlin", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils_fp8.is_fp8_marlin_supported", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils_fp8.pack_fp8_to_int32", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils_fp8.marlin_quant_fp8_torch", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils_fp8.apply_fp8_marlin_linear", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils_fp8.prepare_fp8_moe_layer_for_marlin", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils_fp8.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.utils.marlin_utils_fp8", "names": [ "vllm.model_executor.layers.quantization.utils.marlin_utils_fp8.apply_fp8_marlin_linear", "vllm.model_executor.layers.quantization.utils.marlin_utils_fp8.fp8_fused_exponent_bias_into_scales", "vllm.model_executor.layers.quantization.utils.marlin_utils_fp8.is_fp8_marlin_supported", "vllm.model_executor.layers.quantization.utils.marlin_utils_fp8.logger", "vllm.model_executor.layers.quantization.utils.marlin_utils_fp8.marlin_quant_fp8_torch", "vllm.model_executor.layers.quantization.utils.marlin_utils_fp8.pack_fp8_to_int32", "vllm.model_executor.layers.quantization.utils.marlin_utils_fp8.prepare_fp8_layer_for_marlin", "vllm.model_executor.layers.quantization.utils.marlin_utils_fp8.prepare_fp8_moe_layer_for_marlin" ], "n_typable": 31, "n_typed": 23, "n_any": 0, "n_untyped": 8, "n_functions": 7, "n_function_overloads": 7, "n_function_params": 23, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/utils/marlin_utils_test.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils_test.awq_marlin_quantize", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils_test.MarlinWorkspace", "methods": [ { "kind": "function", "name": "MarlinWorkspace.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MarlinWorkspace.scratch", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 5, "n_typed": 0, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 3, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils_test.marlin_permute_weights", "n_typed": 0, "n_any": 0, "n_untyped": 7, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils_test.get_weight_perm", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils_test.marlin_quantize", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.marlin_utils_test.marlin_weights", "n_typed": 0, "n_any": 0, "n_untyped": 7, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.utils.marlin_utils_test", "names": [ "vllm.model_executor.layers.quantization.utils.marlin_utils_test.MarlinWorkspace", "vllm.model_executor.layers.quantization.utils.marlin_utils_test.awq_marlin_quantize", "vllm.model_executor.layers.quantization.utils.marlin_utils_test.get_weight_perm", "vllm.model_executor.layers.quantization.utils.marlin_utils_test.marlin_permute_weights", "vllm.model_executor.layers.quantization.utils.marlin_utils_test.marlin_quantize", "vllm.model_executor.layers.quantization.utils.marlin_utils_test.marlin_weights" ], "n_typable": 34, "n_typed": 12, "n_any": 0, "n_untyped": 22, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 24, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 3, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/utils/mxfp4_utils.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.mxfp4_utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.mxfp4_utils.get_padding_alignment", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.utils.mxfp4_utils", "names": [ "vllm.model_executor.layers.quantization.utils.mxfp4_utils.get_padding_alignment", "vllm.model_executor.layers.quantization.utils.mxfp4_utils.logger" ], "n_typable": 2, "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/utils/mxfp6_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.mxfp6_utils.dequant_mxfp6", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.mxfp6_utils.quant_dequant_mxfp6", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.utils.mxfp6_utils", "names": [ "vllm.model_executor.layers.quantization.utils.mxfp6_utils.dequant_mxfp6", "vllm.model_executor.layers.quantization.utils.mxfp6_utils.quant_dequant_mxfp6" ], "n_typable": 9, "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 7, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/utils/mxfp8_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.mxfp8_utils.dequant_mxfp8_to_bf16", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.mxfp8_utils.swizzle_mxfp8_scale", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.mxfp8_utils.MXFP8_BLOCK_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.mxfp8_utils.mxfp8_e4m3_quantize", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.mxfp8_utils.mxfp8_e4m3_quantize_fake", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.utils.mxfp8_utils.Mxfp8LinearBackend", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Mxfp8LinearBackend.EMULATION", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Mxfp8LinearBackend.FLASHINFER_CUTLASS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.mxfp8_utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.utils.mxfp8_utils.Mxfp8LinearOp", "methods": [ { "kind": "function", "name": "Mxfp8LinearOp.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Mxfp8LinearOp._apply_emulation", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Mxfp8LinearOp._apply_flashinfer_cutlass", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Mxfp8LinearOp.apply", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Mxfp8LinearOp.backend", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 19, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 16, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.utils.mxfp8_utils", "names": [ "vllm.model_executor.layers.quantization.utils.mxfp8_utils.MXFP8_BLOCK_SIZE", "vllm.model_executor.layers.quantization.utils.mxfp8_utils.Mxfp8LinearBackend", "vllm.model_executor.layers.quantization.utils.mxfp8_utils.Mxfp8LinearOp", "vllm.model_executor.layers.quantization.utils.mxfp8_utils.dequant_mxfp8_to_bf16", "vllm.model_executor.layers.quantization.utils.mxfp8_utils.logger", "vllm.model_executor.layers.quantization.utils.mxfp8_utils.mxfp8_e4m3_quantize", "vllm.model_executor.layers.quantization.utils.mxfp8_utils.mxfp8_e4m3_quantize_fake", "vllm.model_executor.layers.quantization.utils.mxfp8_utils.swizzle_mxfp8_scale" ], "n_typable": 35, "n_typed": 32, "n_any": 0, "n_untyped": 3, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 9, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 16, "n_classes": 2, "n_attrs": 5, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/utils/nvfp4_emulation_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.nvfp4_emulation_utils.dequantize_to_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 7, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.nvfp4_emulation_utils.break_fp4_bytes", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.nvfp4_emulation_utils.ref_nvfp4_quant", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.utils.nvfp4_emulation_utils", "names": [ "vllm.model_executor.layers.quantization.utils.nvfp4_emulation_utils.break_fp4_bytes", "vllm.model_executor.layers.quantization.utils.nvfp4_emulation_utils.dequantize_to_dtype", "vllm.model_executor.layers.quantization.utils.nvfp4_emulation_utils.ref_nvfp4_quant" ], "n_typable": 14, "n_typed": 0, "n_any": 0, "n_untyped": 14, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 11, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/utils/nvfp4_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.nvfp4_utils.pad_nvfp4_weight_for_cutlass", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.nvfp4_utils.convert_to_nvfp4_linear_kernel_format", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.nvfp4_utils.select_nvfp4_linear_backend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.nvfp4_utils.swizzle_blockscale", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.utils.nvfp4_utils.NvFp4LinearBackend", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "NvFp4LinearBackend.VLLM_CUTLASS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NvFp4LinearBackend.FLASHINFER_CUTLASS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NvFp4LinearBackend.FLASHINFER_TRTLLM", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NvFp4LinearBackend.FLASHINFER_CUDNN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NvFp4LinearBackend.FBGEMM", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NvFp4LinearBackend.MARLIN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NvFp4LinearBackend.EMULATION", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 7, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.nvfp4_utils.prepare_weights_for_nvfp4_fbgemm", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.nvfp4_utils.pad_nvfp4_activation_for_cutlass", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.nvfp4_utils.cutlass_fp4_supported", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.nvfp4_utils.prepare_weights_for_nvfp4_cutlass", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.nvfp4_utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.nvfp4_utils.slice_nvfp4_output", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.nvfp4_utils.apply_nvfp4_linear", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.nvfp4_utils.prepare_weights_for_nvfp4_flashinfer_trtllm", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.utils.nvfp4_utils", "names": [ "vllm.model_executor.layers.quantization.utils.nvfp4_utils.NvFp4LinearBackend", "vllm.model_executor.layers.quantization.utils.nvfp4_utils.apply_nvfp4_linear", "vllm.model_executor.layers.quantization.utils.nvfp4_utils.convert_to_nvfp4_linear_kernel_format", "vllm.model_executor.layers.quantization.utils.nvfp4_utils.cutlass_fp4_supported", "vllm.model_executor.layers.quantization.utils.nvfp4_utils.logger", "vllm.model_executor.layers.quantization.utils.nvfp4_utils.pad_nvfp4_activation_for_cutlass", "vllm.model_executor.layers.quantization.utils.nvfp4_utils.pad_nvfp4_weight_for_cutlass", "vllm.model_executor.layers.quantization.utils.nvfp4_utils.prepare_weights_for_nvfp4_cutlass", "vllm.model_executor.layers.quantization.utils.nvfp4_utils.prepare_weights_for_nvfp4_fbgemm", "vllm.model_executor.layers.quantization.utils.nvfp4_utils.prepare_weights_for_nvfp4_flashinfer_trtllm", "vllm.model_executor.layers.quantization.utils.nvfp4_utils.select_nvfp4_linear_backend", "vllm.model_executor.layers.quantization.utils.nvfp4_utils.slice_nvfp4_output", "vllm.model_executor.layers.quantization.utils.nvfp4_utils.swizzle_blockscale" ], "n_typable": 31, "n_typed": 30, "n_any": 0, "n_untyped": 1, "n_functions": 11, "n_function_overloads": 11, "n_function_params": 19, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 1, "n_attrs": 8, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/utils/ocp_mx_utils.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.ocp_mx_utils.OCP_MX_BLOCK_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.ocp_mx_utils.SUPPORTED_OCP_MX_DTYPES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.utils.ocp_mx_utils.OCP_MX_Scheme", "methods": [ { "kind": "function", "name": "OCP_MX_Scheme.from_quant_dtype", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OCP_MX_Scheme.w_mxfp4", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "OCP_MX_Scheme.w_mxfp4_a_mxfp4", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "OCP_MX_Scheme.w_mxfp4_a_mxfp6_e3m2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "OCP_MX_Scheme.w_mxfp4_a_mxfp6_e2m3", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "OCP_MX_Scheme.w_mxfp4_a_fp8", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "OCP_MX_Scheme.w_mxfp6_e3m2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "OCP_MX_Scheme.w_mxfp6_e3m2_a_mxfp6_e3m2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "OCP_MX_Scheme.w_mxfp6_e3m2_a_fp8", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "OCP_MX_Scheme.w_mxfp6_e2m3", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "OCP_MX_Scheme.w_mxfp6_e2m3_a_mxfp6_e2m3", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "OCP_MX_Scheme.w_mxfp6_e2m3_a_fp8", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 11, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.ocp_mx_utils.OCP_MX_DTYPES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.ocp_mx_utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.utils.ocp_mx_utils", "names": [ "vllm.model_executor.layers.quantization.utils.ocp_mx_utils.OCP_MX_BLOCK_SIZE", "vllm.model_executor.layers.quantization.utils.ocp_mx_utils.OCP_MX_DTYPES", "vllm.model_executor.layers.quantization.utils.ocp_mx_utils.OCP_MX_Scheme", "vllm.model_executor.layers.quantization.utils.ocp_mx_utils.SUPPORTED_OCP_MX_DTYPES", "vllm.model_executor.layers.quantization.utils.ocp_mx_utils.logger" ], "n_typable": 4, "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_classes": 1, "n_attrs": 15, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/utils/petit_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.petit_utils.apply_petit_nvfp4_linear", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.petit_utils.verify_petit_nvfp4_supported", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.petit_utils.prepare_nvfp4_layer_for_petit", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.utils.petit_utils", "names": [ "vllm.model_executor.layers.quantization.utils.petit_utils.apply_petit_nvfp4_linear", "vllm.model_executor.layers.quantization.utils.petit_utils.prepare_nvfp4_layer_for_petit", "vllm.model_executor.layers.quantization.utils.petit_utils.verify_petit_nvfp4_supported" ], "n_typable": 13, "n_typed": 13, "n_any": 0, "n_untyped": 0, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 10, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/utils/quant_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.convert_packed_uint4b8_to_signed_int4_inplace", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.kMxfp4Dynamic", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.kNvfp4Static", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.get_fp8_min_max", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.unpack_quantized_values_into_int32", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.unpack_cols", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.kFp8StaticTensorSym", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.kMxfp4StaticGroupScale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.kMxfp4Static", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.scaled_quantize", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.kFp8StaticChannelSym", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.SUPPORTED_GROUP_SIZES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.is_layer_skipped", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.group_broadcast", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.kStaticChannelScale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.kDynamic128Scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.pack_cols", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.awq_pack", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.kStaticTokenScale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.kMxfp8DynamicGroupScale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.scaled_dequantize", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.pack_quantized_values_into_int32", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.kMxfp8Dynamic", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.convert_bf16_scales_to_fp8", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.sort_weights", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.ScaleDesc", "methods": [ { "kind": "function", "name": "ScaleDesc.__str__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ScaleDesc.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ScaleDesc.static", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ScaleDesc.group_shape", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.kFp8DynamicTensorSym", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.QuantKey", "methods": [ { "kind": "function", "name": "QuantKey.__str__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "QuantKey.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "QuantKey.scale", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "QuantKey.scale2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "QuantKey.symmetric", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.pack_rows", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.get_attribute_fallback", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.get_pack_factor", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.kFp8StaticTokenSym", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.kMxfp4DynamicGroupScale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.kDynamicTokenScale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.kNvfp4StaticGroupScale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.kDynamic64Scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.kDynamicTensorScale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.kFp8Dynamic64Sym", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.gptq_pack", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.GroupShape", "methods": [ { "kind": "function", "name": "GroupShape.is_per_tensor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GroupShape.is_per_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GroupShape.is_per_channel", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GroupShape.is_per_group", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GroupShape.PER_TENSOR", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GroupShape.PER_TOKEN", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GroupShape.PER_CHANNEL", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.SUPPORTED_GPTQ_QUANT_TYPES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.gptq_quantize_weights", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.kNvfp4Dynamic", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.kFp8Dynamic128Sym", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.quantize_weights", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.prep_scale_for_group_broadcast", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.kStaticTensorScale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.FP8_DTYPE", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.kStatic128BlockScale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.permute_rows", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.get_and_maybe_dequant_weights", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.kFp8Static128BlockSym", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.kNvfp4DynamicGroupScale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.quant_utils.kFp8DynamicTokenSym", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.utils.quant_utils", "names": [ "vllm.model_executor.layers.quantization.utils.quant_utils.FP8_DTYPE", "vllm.model_executor.layers.quantization.utils.quant_utils.GroupShape", "vllm.model_executor.layers.quantization.utils.quant_utils.QuantKey", "vllm.model_executor.layers.quantization.utils.quant_utils.SUPPORTED_GPTQ_QUANT_TYPES", "vllm.model_executor.layers.quantization.utils.quant_utils.SUPPORTED_GROUP_SIZES", "vllm.model_executor.layers.quantization.utils.quant_utils.ScaleDesc", "vllm.model_executor.layers.quantization.utils.quant_utils.awq_pack", "vllm.model_executor.layers.quantization.utils.quant_utils.convert_bf16_scales_to_fp8", "vllm.model_executor.layers.quantization.utils.quant_utils.convert_packed_uint4b8_to_signed_int4_inplace", "vllm.model_executor.layers.quantization.utils.quant_utils.get_and_maybe_dequant_weights", "vllm.model_executor.layers.quantization.utils.quant_utils.get_attribute_fallback", "vllm.model_executor.layers.quantization.utils.quant_utils.get_fp8_min_max", "vllm.model_executor.layers.quantization.utils.quant_utils.get_pack_factor", "vllm.model_executor.layers.quantization.utils.quant_utils.gptq_pack", "vllm.model_executor.layers.quantization.utils.quant_utils.gptq_quantize_weights", "vllm.model_executor.layers.quantization.utils.quant_utils.group_broadcast", "vllm.model_executor.layers.quantization.utils.quant_utils.is_layer_skipped", "vllm.model_executor.layers.quantization.utils.quant_utils.kDynamic128Scale", "vllm.model_executor.layers.quantization.utils.quant_utils.kDynamic64Scale", "vllm.model_executor.layers.quantization.utils.quant_utils.kDynamicTensorScale", "vllm.model_executor.layers.quantization.utils.quant_utils.kDynamicTokenScale", "vllm.model_executor.layers.quantization.utils.quant_utils.kFp8Dynamic128Sym", "vllm.model_executor.layers.quantization.utils.quant_utils.kFp8Dynamic64Sym", "vllm.model_executor.layers.quantization.utils.quant_utils.kFp8DynamicTensorSym", "vllm.model_executor.layers.quantization.utils.quant_utils.kFp8DynamicTokenSym", "vllm.model_executor.layers.quantization.utils.quant_utils.kFp8Static128BlockSym", "vllm.model_executor.layers.quantization.utils.quant_utils.kFp8StaticChannelSym", "vllm.model_executor.layers.quantization.utils.quant_utils.kFp8StaticTensorSym", "vllm.model_executor.layers.quantization.utils.quant_utils.kFp8StaticTokenSym", "vllm.model_executor.layers.quantization.utils.quant_utils.kMxfp4Dynamic", "vllm.model_executor.layers.quantization.utils.quant_utils.kMxfp4DynamicGroupScale", "vllm.model_executor.layers.quantization.utils.quant_utils.kMxfp4Static", "vllm.model_executor.layers.quantization.utils.quant_utils.kMxfp4StaticGroupScale", "vllm.model_executor.layers.quantization.utils.quant_utils.kMxfp8Dynamic", "vllm.model_executor.layers.quantization.utils.quant_utils.kMxfp8DynamicGroupScale", "vllm.model_executor.layers.quantization.utils.quant_utils.kNvfp4Dynamic", "vllm.model_executor.layers.quantization.utils.quant_utils.kNvfp4DynamicGroupScale", "vllm.model_executor.layers.quantization.utils.quant_utils.kNvfp4Static", "vllm.model_executor.layers.quantization.utils.quant_utils.kNvfp4StaticGroupScale", "vllm.model_executor.layers.quantization.utils.quant_utils.kStatic128BlockScale", "vllm.model_executor.layers.quantization.utils.quant_utils.kStaticChannelScale", "vllm.model_executor.layers.quantization.utils.quant_utils.kStaticTensorScale", "vllm.model_executor.layers.quantization.utils.quant_utils.kStaticTokenScale", "vllm.model_executor.layers.quantization.utils.quant_utils.pack_cols", "vllm.model_executor.layers.quantization.utils.quant_utils.pack_quantized_values_into_int32", "vllm.model_executor.layers.quantization.utils.quant_utils.pack_rows", "vllm.model_executor.layers.quantization.utils.quant_utils.permute_rows", "vllm.model_executor.layers.quantization.utils.quant_utils.prep_scale_for_group_broadcast", "vllm.model_executor.layers.quantization.utils.quant_utils.quantize_weights", "vllm.model_executor.layers.quantization.utils.quant_utils.scaled_dequantize", "vllm.model_executor.layers.quantization.utils.quant_utils.scaled_quantize", "vllm.model_executor.layers.quantization.utils.quant_utils.sort_weights", "vllm.model_executor.layers.quantization.utils.quant_utils.unpack_cols", "vllm.model_executor.layers.quantization.utils.quant_utils.unpack_quantized_values_into_int32" ], "n_typable": 125, "n_typed": 77, "n_any": 0, "n_untyped": 48, "n_functions": 22, "n_function_overloads": 22, "n_function_params": 67, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 0, "n_classes": 3, "n_attrs": 39, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/quantization/utils/w8a8_utils.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.w8a8_utils.CUTLASS_FP8_SUPPORTED", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.w8a8_utils.requantize_with_max_scale", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.w8a8_utils.cutlass_group_gemm_supported", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.w8a8_utils.cutlass_fp8_supported", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.w8a8_utils.cutlass_block_fp8_supported", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.w8a8_utils.sparse_cutlass_supported", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.w8a8_utils.per_tensor_dequantize", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.w8a8_utils.all_close_1d", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.w8a8_utils.convert_to_channelwise", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.model_executor.layers.quantization.utils.w8a8_utils.CUTLASS_BLOCK_FP8_SUPPORTED", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.quantization.utils.w8a8_utils.normalize_e4m3fn_to_e4m3fnuz", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [], "name": "vllm.model_executor.layers.quantization.utils.w8a8_utils", "names": [ "vllm.model_executor.layers.quantization.utils.w8a8_utils.CUTLASS_BLOCK_FP8_SUPPORTED", "vllm.model_executor.layers.quantization.utils.w8a8_utils.CUTLASS_FP8_SUPPORTED", "vllm.model_executor.layers.quantization.utils.w8a8_utils.all_close_1d", "vllm.model_executor.layers.quantization.utils.w8a8_utils.convert_to_channelwise", "vllm.model_executor.layers.quantization.utils.w8a8_utils.cutlass_block_fp8_supported", "vllm.model_executor.layers.quantization.utils.w8a8_utils.cutlass_fp8_supported", "vllm.model_executor.layers.quantization.utils.w8a8_utils.cutlass_group_gemm_supported", "vllm.model_executor.layers.quantization.utils.w8a8_utils.normalize_e4m3fn_to_e4m3fnuz", "vllm.model_executor.layers.quantization.utils.w8a8_utils.per_tensor_dequantize", "vllm.model_executor.layers.quantization.utils.w8a8_utils.requantize_with_max_scale", "vllm.model_executor.layers.quantization.utils.w8a8_utils.sparse_cutlass_supported" ], "n_typable": 22, "n_typed": 20, "n_any": 0, "n_untyped": 2, "n_functions": 9, "n_function_overloads": 9, "n_function_params": 11, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/resampler.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.resampler.get_2d_sincos_pos_embed", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.model_executor.layers.resampler.BaseResampler", "methods": [ { "kind": "function", "name": "BaseResampler.__init__", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "BaseResampler._repeat", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BaseResampler.num_queries", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseResampler.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseResampler.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseResampler.query", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseResampler.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseResampler.ln_q", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseResampler.ln_kv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseResampler.do_post_projection", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseResampler.kv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseResampler.ln_post", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseResampler.proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 23, "n_typed": 10, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 10, "n_attrs": 11, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.resampler.get_abs_pos", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.layers.resampler.Resampler2", "methods": [ { "kind": "function", "name": "Resampler2.__init__", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "Resampler2.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Resampler2.adaptive", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Resampler2.pos_embed", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 14, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 12, "n_attrs": 2, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.resampler.get_1d_sincos_pos_embed_from_grid", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.model_executor.layers.resampler.DEFAULT_LN", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.resampler.get_2d_sincos_pos_embed_from_grid", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [], "name": "vllm.model_executor.layers.resampler", "names": [ "vllm.model_executor.layers.resampler.BaseResampler", "vllm.model_executor.layers.resampler.DEFAULT_LN", "vllm.model_executor.layers.resampler.Resampler2", "vllm.model_executor.layers.resampler.get_1d_sincos_pos_embed_from_grid", "vllm.model_executor.layers.resampler.get_2d_sincos_pos_embed", "vllm.model_executor.layers.resampler.get_2d_sincos_pos_embed_from_grid", "vllm.model_executor.layers.resampler.get_abs_pos" ], "n_typable": 56, "n_typed": 40, "n_any": 0, "n_untyped": 16, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 12, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 22, "n_classes": 2, "n_attrs": 14, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/rotary_embedding/__init__.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.rotary_embedding.get_rope", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "type_ignores": [], "name": "vllm.model_executor.layers.rotary_embedding", "names": [ "vllm.model_executor.layers.rotary_embedding.get_rope" ], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 6, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/rotary_embedding/base.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.rotary_embedding.base.RotaryEmbedding", "methods": [ { "kind": "function", "name": "RotaryEmbedding.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "RotaryEmbedding.forward_static", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "RotaryEmbedding.forward_native", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "RotaryEmbedding.forward_cuda", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "RotaryEmbedding.forward_hip", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "RotaryEmbedding.forward_xpu", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "RotaryEmbedding.forward_cpu", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "RotaryEmbedding.extra_repr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 37, "n_typed": 37, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 29, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.rotary_embedding.base.RotaryEmbeddingBase", "methods": [ { "kind": "function", "name": "RotaryEmbeddingBase.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "RotaryEmbeddingBase._compute_inv_freq", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RotaryEmbeddingBase._compute_cos_sin_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RotaryEmbeddingBase._match_cos_sin_cache_dtype", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RotaryEmbeddingBase.get_cos_sin", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RotaryEmbeddingBase.head_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RotaryEmbeddingBase.rotary_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RotaryEmbeddingBase.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RotaryEmbeddingBase.base", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RotaryEmbeddingBase.is_neox_style", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RotaryEmbeddingBase.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RotaryEmbeddingBase.use_aiter", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RotaryEmbeddingBase.apply_rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RotaryEmbeddingBase.use_flashinfer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RotaryEmbeddingBase.rocm_aiter_triton_rotary_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RotaryEmbeddingBase.cos_sin_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 26, "n_typed": 16, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 10, "n_attrs": 11, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.rotary_embedding.base", "names": [ "vllm.model_executor.layers.rotary_embedding.base.RotaryEmbedding", "vllm.model_executor.layers.rotary_embedding.base.RotaryEmbeddingBase" ], "n_typable": 63, "n_typed": 53, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 39, "n_classes": 2, "n_attrs": 11, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/rotary_embedding/common.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.rotary_embedding.common.ApplyRotaryEmb", "methods": [ { "kind": "function", "name": "ApplyRotaryEmb.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ApplyRotaryEmb.forward_static", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "ApplyRotaryEmb._pre_process", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ApplyRotaryEmb._post_process", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ApplyRotaryEmb.forward_native", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ApplyRotaryEmb.forward_cuda", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ApplyRotaryEmb.forward_hip", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ApplyRotaryEmb.forward_cpu", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ApplyRotaryEmb.extra_repr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ApplyRotaryEmb.is_neox_style", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ApplyRotaryEmb.enable_fp32_compute", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ApplyRotaryEmb.apply_rotary_emb_flash_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 38, "n_typed": 35, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 26, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.rotary_embedding.common.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.rotary_embedding.common.rotate_neox", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.rotary_embedding.common.rotate_gptj", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.rotary_embedding.common.yarn_find_correction_dim", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.layers.rotary_embedding.common.yarn_find_correction_range", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.model_executor.layers.rotary_embedding.common.yarn_get_mscale", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.rotary_embedding.common.yarn_linear_ramp_mask", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "type_ignores": [], "name": "vllm.model_executor.layers.rotary_embedding.common", "names": [ "vllm.model_executor.layers.rotary_embedding.common.ApplyRotaryEmb", "vllm.model_executor.layers.rotary_embedding.common.logger", "vllm.model_executor.layers.rotary_embedding.common.rotate_gptj", "vllm.model_executor.layers.rotary_embedding.common.rotate_neox", "vllm.model_executor.layers.rotary_embedding.common.yarn_find_correction_dim", "vllm.model_executor.layers.rotary_embedding.common.yarn_find_correction_range", "vllm.model_executor.layers.rotary_embedding.common.yarn_get_mscale", "vllm.model_executor.layers.rotary_embedding.common.yarn_linear_ramp_mask" ], "n_typable": 62, "n_typed": 58, "n_any": 0, "n_untyped": 4, "n_functions": 6, "n_function_overloads": 6, "n_function_params": 17, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 26, "n_classes": 1, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/rotary_embedding/deepseek_scaling_rope.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.rotary_embedding.deepseek_scaling_rope.yarn_get_mscale", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.layers.rotary_embedding.deepseek_scaling_rope.DeepseekScalingRotaryEmbedding", "methods": [ { "kind": "function", "name": "DeepseekScalingRotaryEmbedding.__init__", "n_typed": 14, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 }, { "kind": "function", "name": "DeepseekScalingRotaryEmbedding._compute_inv_freq", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepseekScalingRotaryEmbedding._compute_cos_sin_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeepseekScalingRotaryEmbedding.forward_native", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "DeepseekScalingRotaryEmbedding.forward_hip", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "DeepseekScalingRotaryEmbedding.forward_cuda", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DeepseekScalingRotaryEmbedding.scaling_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekScalingRotaryEmbedding.extrapolation_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekScalingRotaryEmbedding.attn_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekScalingRotaryEmbedding.beta_fast", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekScalingRotaryEmbedding.beta_slow", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekScalingRotaryEmbedding.mscale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekScalingRotaryEmbedding.use_flashinfer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 39, "n_typed": 32, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 26, "n_attrs": 7, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.rotary_embedding.deepseek_scaling_rope", "names": [ "vllm.model_executor.layers.rotary_embedding.deepseek_scaling_rope.DeepseekScalingRotaryEmbedding", "vllm.model_executor.layers.rotary_embedding.deepseek_scaling_rope.yarn_get_mscale" ], "n_typable": 42, "n_typed": 35, "n_any": 0, "n_untyped": 7, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 26, "n_classes": 1, "n_attrs": 7, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/rotary_embedding/dual_chunk_rope.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.rotary_embedding.dual_chunk_rope.DualChunkRotaryEmbedding", "methods": [ { "kind": "function", "name": "DualChunkRotaryEmbedding.__init__", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "DualChunkRotaryEmbedding._compute_inv_freq", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DualChunkRotaryEmbedding._compute_cos_sin_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DualChunkRotaryEmbedding.forward_native", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "DualChunkRotaryEmbedding.forward_cuda", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "DualChunkRotaryEmbedding._apply_rotary_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DualChunkRotaryEmbedding.extra_repr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DualChunkRotaryEmbedding.head_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DualChunkRotaryEmbedding.rotary_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DualChunkRotaryEmbedding.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DualChunkRotaryEmbedding.base", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DualChunkRotaryEmbedding.is_neox_style", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DualChunkRotaryEmbedding.chunk_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DualChunkRotaryEmbedding.local_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DualChunkRotaryEmbedding.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DualChunkRotaryEmbedding.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 36, "n_typed": 23, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 20, "n_attrs": 9, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.rotary_embedding.dual_chunk_rope", "names": [ "vllm.model_executor.layers.rotary_embedding.dual_chunk_rope.DualChunkRotaryEmbedding" ], "n_typable": 36, "n_typed": 23, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 20, "n_classes": 1, "n_attrs": 9, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/rotary_embedding/dynamic_ntk_alpha_rope.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.rotary_embedding.dynamic_ntk_alpha_rope.DynamicNTKAlphaRotaryEmbedding", "methods": [ { "kind": "function", "name": "DynamicNTKAlphaRotaryEmbedding.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "DynamicNTKAlphaRotaryEmbedding._compute_cos_sin_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DynamicNTKAlphaRotaryEmbedding.scaling_alpha", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.rotary_embedding.dynamic_ntk_alpha_rope", "names": [ "vllm.model_executor.layers.rotary_embedding.dynamic_ntk_alpha_rope.DynamicNTKAlphaRotaryEmbedding" ], "n_typable": 10, "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/rotary_embedding/dynamic_ntk_scaling_rope.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.rotary_embedding.dynamic_ntk_scaling_rope.DynamicNTKScalingRotaryEmbedding", "methods": [ { "kind": "function", "name": "DynamicNTKScalingRotaryEmbedding.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "DynamicNTKScalingRotaryEmbedding._compute_cos_sin_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DynamicNTKScalingRotaryEmbedding.scaling_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.rotary_embedding.dynamic_ntk_scaling_rope", "names": [ "vllm.model_executor.layers.rotary_embedding.dynamic_ntk_scaling_rope.DynamicNTKScalingRotaryEmbedding" ], "n_typable": 10, "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/rotary_embedding/ernie45_vl_rope.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.rotary_embedding.ernie45_vl_rope.Ernie4_5_VLRotaryEmbedding", "methods": [ { "kind": "function", "name": "Ernie4_5_VLRotaryEmbedding.forward_native", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Ernie4_5_VLRotaryEmbedding.forward_cuda", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 8, "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.rotary_embedding.ernie45_vl_rope", "names": [ "vllm.model_executor.layers.rotary_embedding.ernie45_vl_rope.Ernie4_5_VLRotaryEmbedding" ], "n_typable": 8, "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/rotary_embedding/fope.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.rotary_embedding.fope.FourierRotaryEmbedding", "methods": [ { "kind": "function", "name": "FourierRotaryEmbedding.__init__", "n_typed": 11, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "FourierRotaryEmbedding._compute_inv_freq", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FourierRotaryEmbedding._compute_cos_sin_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FourierRotaryEmbedding.forward_native", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FourierRotaryEmbedding.weight_loader", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FourierRotaryEmbedding.num_key_value_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FourierRotaryEmbedding.num_inv_freq", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FourierRotaryEmbedding.fope_sep_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FourierRotaryEmbedding.fope_init_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FourierRotaryEmbedding.inv_freq", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FourierRotaryEmbedding.input_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FourierRotaryEmbedding.output_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FourierRotaryEmbedding.cos_coef", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FourierRotaryEmbedding.sin_coef", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FourierRotaryEmbedding.cos_sin_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FourierRotaryEmbedding.update_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 34, "n_typed": 23, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 18, "n_attrs": 11, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.rotary_embedding.fope", "names": [ "vllm.model_executor.layers.rotary_embedding.fope.FourierRotaryEmbedding" ], "n_typable": 34, "n_typed": 23, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 18, "n_classes": 1, "n_attrs": 11, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/rotary_embedding/linear_scaling_rope.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.rotary_embedding.linear_scaling_rope.LinearScalingRotaryEmbedding", "methods": [ { "kind": "function", "name": "LinearScalingRotaryEmbedding.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "LinearScalingRotaryEmbedding._compute_cos_sin_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "LinearScalingRotaryEmbedding.scaling_factor_to_offset", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "LinearScalingRotaryEmbedding.scaling_factors", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 11, "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 1, "n_properties": 1 } ], "type_ignores": [], "name": "vllm.model_executor.layers.rotary_embedding.linear_scaling_rope", "names": [ "vllm.model_executor.layers.rotary_embedding.linear_scaling_rope.LinearScalingRotaryEmbedding" ], "n_typable": 11, "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_classes": 1, "n_attrs": 1, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/rotary_embedding/llama3_rope.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.rotary_embedding.llama3_rope.Llama3RotaryEmbedding", "methods": [ { "kind": "function", "name": "Llama3RotaryEmbedding.__init__", "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "Llama3RotaryEmbedding._compute_inv_freq", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Llama3RotaryEmbedding.scaling_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama3RotaryEmbedding.low_freq_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama3RotaryEmbedding.high_freq_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama3RotaryEmbedding.orig_max_position", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 13, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 11, "n_attrs": 4, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.rotary_embedding.llama3_rope", "names": [ "vllm.model_executor.layers.rotary_embedding.llama3_rope.Llama3RotaryEmbedding" ], "n_typable": 17, "n_typed": 13, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 11, "n_classes": 1, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/rotary_embedding/llama4_vision_rope.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.rotary_embedding.llama4_vision_rope.Llama4VisionRotaryEmbedding", "methods": [ { "kind": "function", "name": "Llama4VisionRotaryEmbedding.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Llama4VisionRotaryEmbedding._compute_inv_freq", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Llama4VisionRotaryEmbedding._compute_cos_sin_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Llama4VisionRotaryEmbedding.forward_native", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Llama4VisionRotaryEmbedding.forward_cuda", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 16, "n_typed": 15, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 11, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.rotary_embedding.llama4_vision_rope", "names": [ "vllm.model_executor.layers.rotary_embedding.llama4_vision_rope.Llama4VisionRotaryEmbedding" ], "n_typable": 16, "n_typed": 15, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 11, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/rotary_embedding/mrope.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.rotary_embedding.mrope.triton_mrope", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "vllm.model_executor.layers.rotary_embedding.mrope.apply_interleaved_rope", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.layers.rotary_embedding.mrope.MRotaryEmbedding", "methods": [ { "kind": "function", "name": "MRotaryEmbedding.__init__", "n_typed": 15, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 15, "n_params": 14, "n_function_overloads": 1, "n_function_params": 14 }, { "kind": "function", "name": "MRotaryEmbedding._compute_inv_freq", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MRotaryEmbedding._compute_cos_sin_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MRotaryEmbedding.forward_native", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MRotaryEmbedding.forward_cuda", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MRotaryEmbedding.forward_cpu", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MRotaryEmbedding.get_next_input_positions", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MRotaryEmbedding.get_next_input_positions_tensor", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MRotaryEmbedding.scaling_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MRotaryEmbedding.extrapolation_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MRotaryEmbedding.attn_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MRotaryEmbedding.beta_fast", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MRotaryEmbedding.beta_slow", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MRotaryEmbedding.truncate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MRotaryEmbedding.cache_max_position_num", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MRotaryEmbedding.mrope_section", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MRotaryEmbedding.mrope_interleaved", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MRotaryEmbedding.mscale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 53, "n_typed": 42, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 35, "n_attrs": 10, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.rotary_embedding.mrope", "names": [ "vllm.model_executor.layers.rotary_embedding.mrope.MRotaryEmbedding", "vllm.model_executor.layers.rotary_embedding.mrope.apply_interleaved_rope", "vllm.model_executor.layers.rotary_embedding.mrope.triton_mrope" ], "n_typable": 65, "n_typed": 54, "n_any": 0, "n_untyped": 11, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 10, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 35, "n_classes": 1, "n_attrs": 10, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/rotary_embedding/mrope_interleaved.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.rotary_embedding.mrope_interleaved.MRotaryEmbeddingInterleaved", "methods": [ { "kind": "function", "name": "MRotaryEmbeddingInterleaved.__init__", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "MRotaryEmbeddingInterleaved._rebuild_pos_emb", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MRotaryEmbeddingInterleaved.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MRotaryEmbeddingInterleaved.get_mrope_interleaved_id_list", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MRotaryEmbeddingInterleaved.cache_max_position_num", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MRotaryEmbeddingInterleaved.mrope_section", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MRotaryEmbeddingInterleaved.mrope_interleaved", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MRotaryEmbeddingInterleaved.mrope_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MRotaryEmbeddingInterleaved.layer_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 25, "n_typed": 20, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 16, "n_attrs": 5, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.rotary_embedding.mrope_interleaved", "names": [ "vllm.model_executor.layers.rotary_embedding.mrope_interleaved.MRotaryEmbeddingInterleaved" ], "n_typable": 25, "n_typed": 20, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 16, "n_classes": 1, "n_attrs": 5, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/rotary_embedding/ntk_scaling_rope.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.rotary_embedding.ntk_scaling_rope.NTKScalingRotaryEmbedding", "methods": [ { "kind": "function", "name": "NTKScalingRotaryEmbedding.__init__", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "NTKScalingRotaryEmbedding._compute_inv_freq", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "NTKScalingRotaryEmbedding.scaling_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NTKScalingRotaryEmbedding.mixed_b", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 11, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 9, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.rotary_embedding.ntk_scaling_rope", "names": [ "vllm.model_executor.layers.rotary_embedding.ntk_scaling_rope.NTKScalingRotaryEmbedding" ], "n_typable": 13, "n_typed": 11, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 9, "n_classes": 1, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/rotary_embedding/phi3_long_rope_scaled_rope.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.layers.rotary_embedding.phi3_long_rope_scaled_rope.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.rotary_embedding.phi3_long_rope_scaled_rope.Phi3LongRoPEScaledRotaryEmbedding", "methods": [ { "kind": "function", "name": "Phi3LongRoPEScaledRotaryEmbedding.__init__", "n_typed": 11, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "Phi3LongRoPEScaledRotaryEmbedding._compute_inv_freq", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Phi3LongRoPEScaledRotaryEmbedding._compute_cos_sin_cache", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Phi3LongRoPEScaledRotaryEmbedding.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Phi3LongRoPEScaledRotaryEmbedding.rotary_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi3LongRoPEScaledRotaryEmbedding.head_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi3LongRoPEScaledRotaryEmbedding.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi3LongRoPEScaledRotaryEmbedding.original_max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi3LongRoPEScaledRotaryEmbedding.base", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi3LongRoPEScaledRotaryEmbedding.short_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi3LongRoPEScaledRotaryEmbedding.long_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi3LongRoPEScaledRotaryEmbedding.use_long_rope", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi3LongRoPEScaledRotaryEmbedding.short_mscale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi3LongRoPEScaledRotaryEmbedding.long_mscale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 33, "n_typed": 22, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 19, "n_attrs": 10, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.rotary_embedding.phi3_long_rope_scaled_rope", "names": [ "vllm.model_executor.layers.rotary_embedding.phi3_long_rope_scaled_rope.Phi3LongRoPEScaledRotaryEmbedding", "vllm.model_executor.layers.rotary_embedding.phi3_long_rope_scaled_rope.logger" ], "n_typable": 34, "n_typed": 22, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 19, "n_classes": 1, "n_attrs": 11, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/rotary_embedding/xdrope.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.rotary_embedding.xdrope.XDRotaryEmbedding", "methods": [ { "kind": "function", "name": "XDRotaryEmbedding.__init__", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "XDRotaryEmbedding.forward_native", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "XDRotaryEmbedding.forward_cuda", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "XDRotaryEmbedding.get_next_input_positions", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "XDRotaryEmbedding.get_next_input_positions_tensor", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "XDRotaryEmbedding.xdrope_section", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 29, "n_typed": 27, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 23, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.rotary_embedding.xdrope", "names": [ "vllm.model_executor.layers.rotary_embedding.xdrope.XDRotaryEmbedding" ], "n_typable": 29, "n_typed": 27, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 23, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/rotary_embedding/yarn_scaling_rope.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.rotary_embedding.yarn_scaling_rope.YaRNScalingRotaryEmbedding", "methods": [ { "kind": "function", "name": "YaRNScalingRotaryEmbedding.__init__", "n_typed": 14, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 }, { "kind": "function", "name": "YaRNScalingRotaryEmbedding._compute_inv_freq", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "YaRNScalingRotaryEmbedding._compute_cos_sin_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "YaRNScalingRotaryEmbedding.scaling_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "YaRNScalingRotaryEmbedding.extrapolation_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "YaRNScalingRotaryEmbedding.attn_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "YaRNScalingRotaryEmbedding.beta_fast", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "YaRNScalingRotaryEmbedding.beta_slow", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "YaRNScalingRotaryEmbedding.truncate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "YaRNScalingRotaryEmbedding.mscale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 24, "n_typed": 17, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 14, "n_attrs": 7, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.layers.rotary_embedding.yarn_scaling_rope", "names": [ "vllm.model_executor.layers.rotary_embedding.yarn_scaling_rope.YaRNScalingRotaryEmbedding" ], "n_typable": 24, "n_typed": 17, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 14, "n_classes": 1, "n_attrs": 7, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/sparse_attn_indexer.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.sparse_attn_indexer.sparse_attn_indexer_fake", "n_typed": 14, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 }, { "kind": "attr", "name": "vllm.model_executor.layers.sparse_attn_indexer.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.layers.sparse_attn_indexer.SparseAttnIndexer", "methods": [ { "kind": "function", "name": "SparseAttnIndexer.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "SparseAttnIndexer.forward_native", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "SparseAttnIndexer.forward_cuda", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "SparseAttnIndexer.forward_hip", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SparseAttnIndexer.k_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SparseAttnIndexer.quant_block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SparseAttnIndexer.scale_fmt", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SparseAttnIndexer.topk_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SparseAttnIndexer.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SparseAttnIndexer.max_model_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SparseAttnIndexer.max_total_seq_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SparseAttnIndexer.topk_indices_buffer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 32, "n_typed": 19, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 20, "n_attrs": 8, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.sparse_attn_indexer.sparse_attn_indexer", "n_typed": 14, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 } ], "type_ignores": [], "name": "vllm.model_executor.layers.sparse_attn_indexer", "names": [ "vllm.model_executor.layers.sparse_attn_indexer.SparseAttnIndexer", "vllm.model_executor.layers.sparse_attn_indexer.logger", "vllm.model_executor.layers.sparse_attn_indexer.sparse_attn_indexer", "vllm.model_executor.layers.sparse_attn_indexer.sparse_attn_indexer_fake" ], "n_typable": 61, "n_typed": 47, "n_any": 0, "n_untyped": 14, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 26, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 20, "n_classes": 1, "n_attrs": 9, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.layers.utils.rocm_unquantized_gemm_impl", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.utils.check_cpu_sgl_kernel", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.utils.apply_penalties", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.model_executor.layers.utils.is_layer_moe_router_gate", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.utils.dispatch_unquantized_gemm", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.utils.default_unquantized_gemm", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.layers.utils.use_aiter_triton_gemm", "n_typed": 0, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.layers.utils.dispatch_cpu_unquantized_gemm", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.utils.cpu_unquantized_gemm", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.layers.utils.get_token_bin_counts_and_mask", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.layers.utils.rocm_unquantized_gemm_fake", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.model_executor.layers.utils.MOE_LAYER_ROUTER_GATE_SUFFIXES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.layers.utils.rocm_unquantized_gemm", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "type_ignores": [], "name": "vllm.model_executor.layers.utils", "names": [ "vllm.model_executor.layers.utils.MOE_LAYER_ROUTER_GATE_SUFFIXES", "vllm.model_executor.layers.utils.apply_penalties", "vllm.model_executor.layers.utils.check_cpu_sgl_kernel", "vllm.model_executor.layers.utils.cpu_unquantized_gemm", "vllm.model_executor.layers.utils.default_unquantized_gemm", "vllm.model_executor.layers.utils.dispatch_cpu_unquantized_gemm", "vllm.model_executor.layers.utils.dispatch_unquantized_gemm", "vllm.model_executor.layers.utils.get_token_bin_counts_and_mask", "vllm.model_executor.layers.utils.is_layer_moe_router_gate", "vllm.model_executor.layers.utils.logger", "vllm.model_executor.layers.utils.rocm_unquantized_gemm", "vllm.model_executor.layers.utils.rocm_unquantized_gemm_fake", "vllm.model_executor.layers.utils.rocm_unquantized_gemm_impl", "vllm.model_executor.layers.utils.use_aiter_triton_gemm" ], "n_typable": 50, "n_typed": 42, "n_any": 0, "n_untyped": 8, "n_functions": 12, "n_function_overloads": 12, "n_function_params": 37, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/layers/vocab_parallel_embedding.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.layers.vocab_parallel_embedding.UnquantizedEmbeddingMethod", "methods": [ { "kind": "function", "name": "UnquantizedEmbeddingMethod.create_weights", "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "UnquantizedEmbeddingMethod.process_weights_after_loading", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "UnquantizedEmbeddingMethod.apply", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "UnquantizedEmbeddingMethod.embedding", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 17, "n_typed": 15, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 13, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.vocab_parallel_embedding.get_masked_input_and_mask", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.model_executor.layers.vocab_parallel_embedding.pad_vocab_size", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.layers.vocab_parallel_embedding.vocab_range_from_global_vocab_size", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.model_executor.layers.vocab_parallel_embedding.VocabParallelEmbedding", "methods": [ { "kind": "function", "name": "VocabParallelEmbedding.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "VocabParallelEmbedding._get_indices", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "VocabParallelEmbedding.get_sharded_to_full_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "VocabParallelEmbedding.weight_loader", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VocabParallelEmbedding.forward_native", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "VocabParallelEmbedding.forward_cuda", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "VocabParallelEmbedding.extra_repr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "VocabParallelEmbedding.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VocabParallelEmbedding.num_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VocabParallelEmbedding.padding_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VocabParallelEmbedding.org_vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VocabParallelEmbedding.org_vocab_size_padded", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VocabParallelEmbedding.num_embeddings_padded", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VocabParallelEmbedding.shard_indices", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VocabParallelEmbedding.embedding_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VocabParallelEmbedding.quant_method", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VocabParallelEmbedding.num_added_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VocabParallelEmbedding.num_embeddings_per_partition", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VocabParallelEmbedding.num_org_embeddings_per_partition", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VocabParallelEmbedding.num_added_embeddings_per_partition", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 37, "n_typed": 19, "n_any": 0, "n_untyped": 18, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 17, "n_attrs": 13, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.layers.vocab_parallel_embedding.DEFAULT_VOCAB_PADDING_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.layers.vocab_parallel_embedding.ParallelLMHead", "methods": [ { "kind": "function", "name": "ParallelLMHead.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "ParallelLMHead.tie_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ParallelLMHead.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ParallelLMHead.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ParallelLMHead.bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 9, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 10, "n_attrs": 2, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.layers.vocab_parallel_embedding.vocab_range_from_per_partition_vocab_size", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.model_executor.layers.vocab_parallel_embedding.VocabParallelEmbeddingShardIndices", "methods": [ { "kind": "function", "name": "VocabParallelEmbeddingShardIndices.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "VocabParallelEmbeddingShardIndices.num_org_elements", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "VocabParallelEmbeddingShardIndices.num_added_elements", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "VocabParallelEmbeddingShardIndices.num_org_elements_padded", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "VocabParallelEmbeddingShardIndices.num_added_elements_padded", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "VocabParallelEmbeddingShardIndices.num_org_vocab_padding", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "VocabParallelEmbeddingShardIndices.num_added_vocab_padding", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "VocabParallelEmbeddingShardIndices.num_elements_padded", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "VocabParallelEmbeddingShardIndices.padded_org_vocab_start_index", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VocabParallelEmbeddingShardIndices.padded_org_vocab_end_index", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VocabParallelEmbeddingShardIndices.padded_added_vocab_start_index", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VocabParallelEmbeddingShardIndices.padded_added_vocab_end_index", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VocabParallelEmbeddingShardIndices.org_vocab_start_index", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VocabParallelEmbeddingShardIndices.org_vocab_end_index", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VocabParallelEmbeddingShardIndices.added_vocab_start_index", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VocabParallelEmbeddingShardIndices.added_vocab_end_index", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 8, "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 8, "n_properties": 7 } ], "type_ignores": [], "name": "vllm.model_executor.layers.vocab_parallel_embedding", "names": [ "vllm.model_executor.layers.vocab_parallel_embedding.DEFAULT_VOCAB_PADDING_SIZE", "vllm.model_executor.layers.vocab_parallel_embedding.ParallelLMHead", "vllm.model_executor.layers.vocab_parallel_embedding.UnquantizedEmbeddingMethod", "vllm.model_executor.layers.vocab_parallel_embedding.VocabParallelEmbedding", "vllm.model_executor.layers.vocab_parallel_embedding.VocabParallelEmbeddingShardIndices", "vllm.model_executor.layers.vocab_parallel_embedding.get_masked_input_and_mask", "vllm.model_executor.layers.vocab_parallel_embedding.pad_vocab_size", "vllm.model_executor.layers.vocab_parallel_embedding.vocab_range_from_global_vocab_size", "vllm.model_executor.layers.vocab_parallel_embedding.vocab_range_from_per_partition_vocab_size" ], "n_typable": 96, "n_typed": 69, "n_any": 0, "n_untyped": 27, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 15, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 40, "n_classes": 4, "n_attrs": 24, "n_properties": 7, "n_type_ignores": 0 }, { "path": "vllm/model_executor/model_loader/__init__.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.model_loader.get_model_loader", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.model_loader.get_model", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.model_loader.register_model_loader", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.model_executor.model_loader", "names": [ "vllm.model_executor.model_loader.get_model", "vllm.model_executor.model_loader.get_model_loader", "vllm.model_executor.model_loader.register_model_loader" ], "n_typable": 9, "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 6, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/model_loader/bitsandbytes_loader.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.model_loader.bitsandbytes_loader.BitsAndBytesModelLoader", "methods": [ { "kind": "function", "name": "BitsAndBytesModelLoader.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BitsAndBytesModelLoader._get_weight_files", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BitsAndBytesModelLoader._prepare_weights", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BitsAndBytesModelLoader._hf_weight_iter", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BitsAndBytesModelLoader._get_quantized_weights_iterator", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BitsAndBytesModelLoader._is_8bit_weight_name", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BitsAndBytesModelLoader._is_4bit_weight_name", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BitsAndBytesModelLoader._quantized_8bit_generator", "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BitsAndBytesModelLoader._quantized_4bit_generator", "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BitsAndBytesModelLoader._unquantized_generator", "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BitsAndBytesModelLoader._get_bnb_target_modules", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BitsAndBytesModelLoader._classify_module_sharding", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BitsAndBytesModelLoader._verify_model_compatibility", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BitsAndBytesModelLoader._initialize_loader_state", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BitsAndBytesModelLoader._dequantize_dq", "n_typed": 0, "n_any": 1, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BitsAndBytesModelLoader._fuse_moe_quant_states", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BitsAndBytesModelLoader._stack_quantization_states", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BitsAndBytesModelLoader._bind_quant_states_to_params", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BitsAndBytesModelLoader.load_weights", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BitsAndBytesModelLoader.download_model", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BitsAndBytesModelLoader.possible_config_file_names", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BitsAndBytesModelLoader.unsharded_weights_modules", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BitsAndBytesModelLoader.column_sharded_weights_modules", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BitsAndBytesModelLoader.maybe_fused_weights_modules", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BitsAndBytesModelLoader.target_modules", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BitsAndBytesModelLoader.tp_disabled_modules", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BitsAndBytesModelLoader.expert_params_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BitsAndBytesModelLoader.weight_mapper", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BitsAndBytesModelLoader.pre_quant", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BitsAndBytesModelLoader.load_8bit", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BitsAndBytesModelLoader.is_pool_model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 67, "n_typed": 50, "n_any": 1, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 20, "n_method_overloads": 20, "n_method_params": 37, "n_attrs": 11, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.model_loader.bitsandbytes_loader.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.model_loader.bitsandbytes_loader", "names": [ "vllm.model_executor.model_loader.bitsandbytes_loader.BitsAndBytesModelLoader", "vllm.model_executor.model_loader.bitsandbytes_loader.logger" ], "n_typable": 68, "n_typed": 50, "n_any": 1, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 20, "n_method_overloads": 20, "n_method_params": 37, "n_classes": 1, "n_attrs": 12, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/model_loader/utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.model_loader.utils.get_model_cls", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.model_loader.utils.get_architecture_class_name", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.model_loader.utils.get_model_architecture", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.model_executor.model_loader.utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.model_loader.utils.ParamMapping", "methods": [ { "kind": "function", "name": "ParamMapping.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ParamMapping.get_sub_modules", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ParamMapping.packed_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ParamMapping.inverse_packed_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 2, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.model_loader.utils.initialize_model", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.model_loader.utils.process_weights_after_loading", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.model_loader.utils.device_loading_context", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.model_loader.utils.configure_quant_config", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.model_executor.model_loader.utils", "names": [ "vllm.model_executor.model_loader.utils.ParamMapping", "vllm.model_executor.model_loader.utils.configure_quant_config", "vllm.model_executor.model_loader.utils.device_loading_context", "vllm.model_executor.model_loader.utils.get_architecture_class_name", "vllm.model_executor.model_loader.utils.get_model_architecture", "vllm.model_executor.model_loader.utils.get_model_cls", "vllm.model_executor.model_loader.utils.initialize_model", "vllm.model_executor.model_loader.utils.logger", "vllm.model_executor.model_loader.utils.process_weights_after_loading" ], "n_typable": 25, "n_typed": 21, "n_any": 0, "n_untyped": 4, "n_functions": 7, "n_function_overloads": 7, "n_function_params": 14, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_classes": 1, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/model_loader/gguf_loader.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.model_loader.gguf_loader.GGUFModelLoader", "methods": [ { "kind": "function", "name": "GGUFModelLoader.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GGUFModelLoader._prepare_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GGUFModelLoader._get_gguf_weights_map", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GGUFModelLoader._get_gguf_weight_type", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GGUFModelLoader._get_weights_iterator", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GGUFModelLoader.download_model", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GGUFModelLoader.load_weights", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GGUFModelLoader.load_model", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 23, "n_typed": 20, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 15, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.model_loader.gguf_loader.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.model_loader.gguf_loader", "names": [ "vllm.model_executor.model_loader.gguf_loader.GGUFModelLoader", "vllm.model_executor.model_loader.gguf_loader.logger" ], "n_typable": 24, "n_typed": 20, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 15, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/model_loader/default_loader.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.model_loader.default_loader.DefaultModelLoader", "methods": [ { "kind": "function", "name": "DefaultModelLoader.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DefaultModelLoader._prepare_weights", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "DefaultModelLoader._get_weights_iterator", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DefaultModelLoader.get_all_weights", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DefaultModelLoader.download_model", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DefaultModelLoader.load_weights", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DefaultModelLoader.DEFAULT_NUM_THREADS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DefaultModelLoader.counter_before_loading_weights", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DefaultModelLoader.counter_after_loading_weights", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 19, "n_typed": 18, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 11, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.model_loader.default_loader.Source", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Source.model_or_path", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Source.revision", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Source.prefix", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Source.fall_back_to_pt", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Source.allow_patterns_overrides", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 5, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.model_loader.default_loader.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.model_loader.default_loader", "names": [ "vllm.model_executor.model_loader.default_loader.DefaultModelLoader", "vllm.model_executor.model_loader.default_loader.Source", "vllm.model_executor.model_loader.default_loader.logger" ], "n_typable": 20, "n_typed": 18, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 11, "n_classes": 2, "n_attrs": 9, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/model_loader/sharded_state_loader.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.model_loader.sharded_state_loader.ShardedStateLoader", "methods": [ { "kind": "function", "name": "ShardedStateLoader.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ShardedStateLoader._filter_subtensors", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ShardedStateLoader._prepare_weights", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ShardedStateLoader.download_model", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ShardedStateLoader.load_weights", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ShardedStateLoader.iterate_over_files", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ShardedStateLoader.save_model", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ShardedStateLoader.DEFAULT_PATTERN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ShardedStateLoader.pattern", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 16, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 12, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.model_loader.sharded_state_loader.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.model_loader.sharded_state_loader", "names": [ "vllm.model_executor.model_loader.sharded_state_loader.ShardedStateLoader", "vllm.model_executor.model_loader.sharded_state_loader.logger" ], "n_typable": 21, "n_typed": 16, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 12, "n_classes": 1, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/model_loader/tensorizer_loader.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.model_loader.tensorizer_loader.TensorizerLoader", "methods": [ { "kind": "function", "name": "TensorizerLoader.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TensorizerLoader._verify_config", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TensorizerLoader._get_weights_iterator", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TensorizerLoader._load_model_serialized_cpu", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TensorizerLoader.download_model", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TensorizerLoader._patch_tensorizer_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TensorizerLoader.load_weights", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TensorizerLoader.load_model", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "TensorizerLoader.save_model", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TensorizerLoader.tensorizer_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 25, "n_typed": 22, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 15, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.model_loader.tensorizer_loader.BLACKLISTED_TENSORIZER_ARGS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.model_loader.tensorizer_loader.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.model_loader.tensorizer_loader.validate_config", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.model_executor.model_loader.tensorizer_loader", "names": [ "vllm.model_executor.model_loader.tensorizer_loader.BLACKLISTED_TENSORIZER_ARGS", "vllm.model_executor.model_loader.tensorizer_loader.TensorizerLoader", "vllm.model_executor.model_loader.tensorizer_loader.logger", "vllm.model_executor.model_loader.tensorizer_loader.validate_config" ], "n_typable": 28, "n_typed": 23, "n_any": 0, "n_untyped": 5, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 15, "n_classes": 1, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/model_loader/dummy_loader.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.model_loader.dummy_loader.DummyModelLoader", "methods": [ { "kind": "function", "name": "DummyModelLoader.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DummyModelLoader.download_model", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DummyModelLoader.load_weights", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.model_loader.dummy_loader", "names": [ "vllm.model_executor.model_loader.dummy_loader.DummyModelLoader" ], "n_typable": 7, "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/model_loader/base_loader.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.model_loader.base_loader.BaseModelLoader", "methods": [ { "kind": "function", "name": "BaseModelLoader.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseModelLoader.download_model", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseModelLoader.load_weights", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseModelLoader.load_model", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BaseModelLoader.load_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 10, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 7, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.model_loader.base_loader.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.model_loader.base_loader.log_model_inspection", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.model_executor.model_loader.base_loader", "names": [ "vllm.model_executor.model_loader.base_loader.BaseModelLoader", "vllm.model_executor.model_loader.base_loader.log_model_inspection", "vllm.model_executor.model_loader.base_loader.logger" ], "n_typable": 15, "n_typed": 12, "n_any": 0, "n_untyped": 3, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 7, "n_classes": 1, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/model_loader/runai_streamer_loader.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.model_loader.runai_streamer_loader.RunaiModelStreamerLoader", "methods": [ { "kind": "function", "name": "RunaiModelStreamerLoader.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RunaiModelStreamerLoader._prepare_weights", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "RunaiModelStreamerLoader._get_weights_iterator", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "RunaiModelStreamerLoader.download_model", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RunaiModelStreamerLoader.load_weights", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 13, "n_typed": 12, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 8, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.model_loader.runai_streamer_loader", "names": [ "vllm.model_executor.model_loader.runai_streamer_loader.RunaiModelStreamerLoader" ], "n_typable": 13, "n_typed": 12, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 8, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/model_loader/reload/layerwise.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.model_loader.reload.layerwise.finalize_layerwise_reload", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.model_loader.reload.layerwise.initialize_layerwise_reload", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.model_loader.reload.layerwise.record_metadata_for_reloading", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.model_loader.reload.layerwise.get_layerwise_info", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.model_executor.model_loader.reload.layerwise", "names": [ "vllm.model_executor.model_loader.reload.layerwise.finalize_layerwise_reload", "vllm.model_executor.model_loader.reload.layerwise.get_layerwise_info", "vllm.model_executor.model_loader.reload.layerwise.initialize_layerwise_reload", "vllm.model_executor.model_loader.reload.layerwise.record_metadata_for_reloading" ], "n_typable": 9, "n_typed": 6, "n_any": 0, "n_untyped": 3, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 5, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/model_loader/reload/torchao_decorator.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.model_loader.reload.torchao_decorator.support_quantized_model_reload_from_hp_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.model_loader.reload.torchao_decorator.set_torchao_reload_attrs", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.model_executor.model_loader.reload.torchao_decorator", "names": [ "vllm.model_executor.model_loader.reload.torchao_decorator.set_torchao_reload_attrs", "vllm.model_executor.model_loader.reload.torchao_decorator.support_quantized_model_reload_from_hp_weights" ], "n_typable": 5, "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 3, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/model_loader/reload/meta.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.model_loader.reload.meta.capture_layer_to_meta", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.model_loader.reload.meta.get_numel_loaded", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.model_loader.reload.meta.materialize_layer", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.model_loader.reload.meta.materialize_meta_tensor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.model_loader.reload.meta.to_meta_tensor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.model_loader.reload.meta.restore_layer_on_meta", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.model_executor.model_loader.reload.meta", "names": [ "vllm.model_executor.model_loader.reload.meta.capture_layer_to_meta", "vllm.model_executor.model_loader.reload.meta.get_numel_loaded", "vllm.model_executor.model_loader.reload.meta.materialize_layer", "vllm.model_executor.model_loader.reload.meta.materialize_meta_tensor", "vllm.model_executor.model_loader.reload.meta.restore_layer_on_meta", "vllm.model_executor.model_loader.reload.meta.to_meta_tensor" ], "n_typable": 14, "n_typed": 13, "n_any": 0, "n_untyped": 1, "n_functions": 6, "n_function_overloads": 6, "n_function_params": 8, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/model_loader/reload/sanitize.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.model_loader.reload.sanitize.sanitize_layer_refs", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.model_loader.reload.sanitize.restore_layer_refs", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.model_executor.model_loader.reload.sanitize", "names": [ "vllm.model_executor.model_loader.reload.sanitize.restore_layer_refs", "vllm.model_executor.model_loader.reload.sanitize.sanitize_layer_refs" ], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 4, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/model_loader/reload/types.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.model_loader.reload.types.LayerReloadingInfo", "methods": [ { "kind": "function", "name": "LayerReloadingInfo.reset", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LayerReloadingInfo.can_process", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LayerReloadingInfo.restore_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LayerReloadingInfo.kernel_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LayerReloadingInfo.load_numel", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LayerReloadingInfo.load_numel_total", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LayerReloadingInfo.loaded_weights", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 2, "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 0, "n_attrs": 5, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.model_loader.reload.types.LayerTensors", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.model_executor.model_loader.reload.types", "names": [ "vllm.model_executor.model_loader.reload.types.LayerReloadingInfo", "vllm.model_executor.model_loader.reload.types.LayerTensors" ], "n_typable": 2, "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 0, "n_classes": 1, "n_attrs": 6, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/model_loader/reload/utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.model_loader.reload.utils.get_layer_tensors", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.model_loader.reload.utils.get_layer_params_buffers", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.model_loader.reload.utils.get_layer_size", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.model_executor.model_loader.reload.utils", "names": [ "vllm.model_executor.model_loader.reload.utils.get_layer_params_buffers", "vllm.model_executor.model_loader.reload.utils.get_layer_size", "vllm.model_executor.model_loader.reload.utils.get_layer_tensors" ], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 3, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/model_loader/tensorizer.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.model_loader.tensorizer.EncryptionParams", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.model_loader.tensorizer.no_init_or_tensor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.model_loader.tensorizer.TensorDeserializer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.model_loader.tensorizer.open_stream", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.model_loader.tensorizer.TensorizerConfig", "methods": [ { "kind": "function", "name": "TensorizerConfig.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TensorizerConfig.to_serializable", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TensorizerConfig._construct_tensorizer_args", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TensorizerConfig.verify_with_parallel_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TensorizerConfig.verify_with_model_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TensorizerConfig.open_stream", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TensorizerConfig.keys", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TensorizerConfig.__len__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TensorizerConfig.__iter__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TensorizerConfig.__getitem__", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TensorizerConfig.__setitem__", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TensorizerConfig.__delitem__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TensorizerConfig.tensorizer_uri", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TensorizerConfig.tensorizer_dir", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TensorizerConfig.vllm_tensorized", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TensorizerConfig.verify_hash", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TensorizerConfig.num_readers", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TensorizerConfig.encryption_keyfile", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TensorizerConfig.s3_access_key_id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TensorizerConfig.s3_secret_access_key", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TensorizerConfig.s3_endpoint", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TensorizerConfig.lora_dir", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TensorizerConfig.stream_kwargs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TensorizerConfig.serialization_kwargs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TensorizerConfig.deserialization_kwargs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TensorizerConfig._extra_serialization_attrs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TensorizerConfig.model_class", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TensorizerConfig.hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TensorizerConfig.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TensorizerConfig._is_sharded", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TensorizerConfig._fields", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TensorizerConfig._keys", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 19, "n_typed": 10, "n_any": 2, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 7, "n_attrs": 20, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.model_loader.tensorizer.get_mem_usage", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.model_loader.tensorizer.DecryptionParams", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.model_loader.tensorizer.convert_bytes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.model_loader.tensorizer.TensorSerializer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.model_loader.tensorizer", "names": [ "vllm.model_executor.model_loader.tensorizer.DecryptionParams", "vllm.model_executor.model_loader.tensorizer.EncryptionParams", "vllm.model_executor.model_loader.tensorizer.TensorDeserializer", "vllm.model_executor.model_loader.tensorizer.TensorSerializer", "vllm.model_executor.model_loader.tensorizer.TensorizerConfig", "vllm.model_executor.model_loader.tensorizer.convert_bytes", "vllm.model_executor.model_loader.tensorizer.get_mem_usage", "vllm.model_executor.model_loader.tensorizer.no_init_or_tensor", "vllm.model_executor.model_loader.tensorizer.open_stream" ], "n_typable": 27, "n_typed": 10, "n_any": 2, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 7, "n_classes": 1, "n_attrs": 28, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/model_loader/weight_utils.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.model_loader.weight_utils.SafeTensorsFileLoader", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.model_loader.weight_utils.SingleGroup", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.model_loader.weight_utils.get_sparse_attention_config", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.model_loader.weight_utils.initialize_single_dummy_weight", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.model_loader.weight_utils.download_weights_from_hf", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.model_executor.model_loader.weight_utils.get_gguf_weight_type_map", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.model_loader.weight_utils.runai_safetensors_weights_iterator", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.model_loader.weight_utils.enable_xet_high_performance", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.model_executor.model_loader.weight_utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.model_loader.weight_utils.fastsafetensors_weights_iterator", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.model_executor.model_loader.weight_utils.gguf", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.model_loader.weight_utils.sharded_weight_loader", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.model_executor.model_loader.weight_utils.temp_dir", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.model_loader.weight_utils.SafetensorsStreamer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.model_loader.weight_utils.convert_bin_to_safetensor_file", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.model_loader.weight_utils.maybe_download_from_modelscope", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.model_executor.model_loader.weight_utils.np_cache_weights_iterator", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.model_executor.model_loader.weight_utils.get_gguf_extra_tensor_names", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.model_loader.weight_utils.download_safetensors_index_file_from_hf", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.model_loader.weight_utils.enable_hf_transfer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.model_executor.model_loader.weight_utils.convert_pyslice_to_tensor", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.model_executor.model_loader.weight_utils.fastsafetensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.model_loader.weight_utils.runai_model_streamer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.model_loader.weight_utils.get_lock", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.model_loader.weight_utils.multi_thread_pt_weights_iterator", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.model_loader.weight_utils.composed_weight_loader", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.model_loader.weight_utils.filter_files_not_needed_for_inference", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.model_executor.model_loader.weight_utils.LoaderFunction", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.model_loader.weight_utils.download_gguf", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.model_executor.model_loader.weight_utils.get_quant_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.model_loader.weight_utils.pt_weights_iterator", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.model_loader.weight_utils.filter_duplicate_safetensors_files", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.model_loader.weight_utils.multi_thread_safetensors_weights_iterator", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.model_loader.weight_utils.atomic_writer", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.model_loader.weight_utils.enable_tqdm", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.model_loader.weight_utils.gguf_quant_weights_iterator", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.model_loader.weight_utils.maybe_remap_kv_scale_name", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.model_loader.weight_utils.initialize_dummy_weights", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "class", "name": "vllm.model_executor.model_loader.weight_utils.DisabledTqdm", "methods": [ { "kind": "function", "name": "DisabledTqdm.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.model_loader.weight_utils.safetensors_weights_iterator", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.model_loader.weight_utils.default_weight_loader", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.model_loader.weight_utils.row_parallel_weight_loader", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [ { "kind": "type", "rules": [ "assignment" ] } ], "name": "vllm.model_executor.model_loader.weight_utils", "names": [ "vllm.model_executor.model_loader.weight_utils.DisabledTqdm", "vllm.model_executor.model_loader.weight_utils.LoaderFunction", "vllm.model_executor.model_loader.weight_utils.SafeTensorsFileLoader", "vllm.model_executor.model_loader.weight_utils.SafetensorsStreamer", "vllm.model_executor.model_loader.weight_utils.SingleGroup", "vllm.model_executor.model_loader.weight_utils.atomic_writer", "vllm.model_executor.model_loader.weight_utils.composed_weight_loader", "vllm.model_executor.model_loader.weight_utils.convert_bin_to_safetensor_file", "vllm.model_executor.model_loader.weight_utils.convert_pyslice_to_tensor", "vllm.model_executor.model_loader.weight_utils.default_weight_loader", "vllm.model_executor.model_loader.weight_utils.download_gguf", "vllm.model_executor.model_loader.weight_utils.download_safetensors_index_file_from_hf", "vllm.model_executor.model_loader.weight_utils.download_weights_from_hf", "vllm.model_executor.model_loader.weight_utils.enable_hf_transfer", "vllm.model_executor.model_loader.weight_utils.enable_tqdm", "vllm.model_executor.model_loader.weight_utils.enable_xet_high_performance", "vllm.model_executor.model_loader.weight_utils.fastsafetensors", "vllm.model_executor.model_loader.weight_utils.fastsafetensors_weights_iterator", "vllm.model_executor.model_loader.weight_utils.filter_duplicate_safetensors_files", "vllm.model_executor.model_loader.weight_utils.filter_files_not_needed_for_inference", "vllm.model_executor.model_loader.weight_utils.get_gguf_extra_tensor_names", "vllm.model_executor.model_loader.weight_utils.get_gguf_weight_type_map", "vllm.model_executor.model_loader.weight_utils.get_lock", "vllm.model_executor.model_loader.weight_utils.get_quant_config", "vllm.model_executor.model_loader.weight_utils.get_sparse_attention_config", "vllm.model_executor.model_loader.weight_utils.gguf", "vllm.model_executor.model_loader.weight_utils.gguf_quant_weights_iterator", "vllm.model_executor.model_loader.weight_utils.initialize_dummy_weights", "vllm.model_executor.model_loader.weight_utils.initialize_single_dummy_weight", "vllm.model_executor.model_loader.weight_utils.logger", "vllm.model_executor.model_loader.weight_utils.maybe_download_from_modelscope", "vllm.model_executor.model_loader.weight_utils.maybe_remap_kv_scale_name", "vllm.model_executor.model_loader.weight_utils.multi_thread_pt_weights_iterator", "vllm.model_executor.model_loader.weight_utils.multi_thread_safetensors_weights_iterator", "vllm.model_executor.model_loader.weight_utils.np_cache_weights_iterator", "vllm.model_executor.model_loader.weight_utils.pt_weights_iterator", "vllm.model_executor.model_loader.weight_utils.row_parallel_weight_loader", "vllm.model_executor.model_loader.weight_utils.runai_model_streamer", "vllm.model_executor.model_loader.weight_utils.runai_safetensors_weights_iterator", "vllm.model_executor.model_loader.weight_utils.safetensors_weights_iterator", "vllm.model_executor.model_loader.weight_utils.sharded_weight_loader", "vllm.model_executor.model_loader.weight_utils.temp_dir" ], "n_typable": 128, "n_typed": 112, "n_any": 1, "n_untyped": 15, "n_functions": 32, "n_function_overloads": 32, "n_function_params": 84, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_classes": 1, "n_attrs": 9, "n_properties": 0, "n_type_ignores": 1 }, { "path": "vllm/model_executor/models/AXK1.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.AXK1.AXK1Model", "methods": [ { "kind": "function", "name": "AXK1Model.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AXK1Model.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AXK1Model.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AXK1Model.fall_back_to_pt_during_load", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AXK1Model.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Model.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Model.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Model.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Model.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Model.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 9, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.AXK1.AXK1MoE", "methods": [ { "kind": "function", "name": "AXK1MoE.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "AXK1MoE.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AXK1MoE.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1MoE.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1MoE.routed_scaling_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1MoE.ep_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1MoE.ep_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1MoE.ep_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1MoE.n_routed_experts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AXK1MoE.n_shared_experts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AXK1MoE.is_sequence_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1MoE.gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1MoE.enable_eplb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1MoE.n_redundant_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1MoE.n_logical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1MoE.n_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1MoE.n_local_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1MoE.physical_expert_start", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1MoE.physical_expert_end", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1MoE.is_rocm_aiter_moe_enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1MoE.is_fusion_moe_shared_experts_enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1MoE.experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1MoE.shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 28, "n_typed": 8, "n_any": 0, "n_untyped": 20, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 21, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.AXK1.get_spec_layer_idx_from_weight_name", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.models.AXK1.AXK1Attention", "methods": [ { "kind": "function", "name": "AXK1Attention.__init__", "n_typed": 15, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 15, "n_params": 14, "n_function_overloads": 1, "n_function_params": 14 }, { "kind": "function", "name": "AXK1Attention.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AXK1Attention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Attention.qk_nope_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Attention.qk_rope_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Attention.qk_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Attention.v_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Attention.q_lora_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Attention.kv_lora_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Attention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Attention.num_local_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Attention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Attention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Attention.kv_a_proj_with_mqa", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Attention.kv_a_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Attention.kv_b_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Attention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Attention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Attention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Attention.q_a_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Attention.q_a_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Attention.q_b_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Attention.q_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 40, "n_typed": 19, "n_any": 0, "n_untyped": 21, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 17, "n_attrs": 21, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.AXK1.AXK1ForCausalLM", "methods": [ { "kind": "function", "name": "AXK1ForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AXK1ForCausalLM.set_moe_parameters", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AXK1ForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AXK1ForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "AXK1ForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AXK1ForCausalLM.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AXK1ForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AXK1ForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AXK1ForCausalLM.model_cls", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AXK1ForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1ForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1ForCausalLM.use_mha", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1ForCausalLM.fuse_qkv_a_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1ForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1ForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1ForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1ForCausalLM.num_moe_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1ForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 25, "n_typed": 14, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 9, "n_attrs": 11, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.AXK1.AXK1MixtureOfExperts", "methods": [ { "kind": "function", "name": "AXK1MixtureOfExperts.extract_moe_parameters", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AXK1MixtureOfExperts.update_physical_experts_metadata", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AXK1MixtureOfExperts.moe_mlp_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 6, "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.AXK1.AXK1DecoderLayer", "methods": [ { "kind": "function", "name": "AXK1DecoderLayer.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "AXK1DecoderLayer._is_layer_sparse", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AXK1DecoderLayer.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AXK1DecoderLayer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1DecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1DecoderLayer.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1DecoderLayer.use_mha", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1DecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1DecoderLayer.is_layer_sparse", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1DecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1DecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1DecoderLayer.post_mlp_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1DecoderLayer.routed_scaling_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1DecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 10, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 11, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.AXK1.AXK1MLAAttention", "methods": [ { "kind": "function", "name": "AXK1MLAAttention.__init__", "n_typed": 15, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 15, "n_params": 14, "n_function_overloads": 1, "n_function_params": 14 }, { "kind": "function", "name": "AXK1MLAAttention.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AXK1MLAAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1MLAAttention.qk_nope_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1MLAAttention.qk_rope_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1MLAAttention.qk_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1MLAAttention.v_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1MLAAttention.q_lora_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1MLAAttention.kv_lora_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1MLAAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1MLAAttention.num_local_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1MLAAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1MLAAttention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1MLAAttention.kv_a_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1MLAAttention.kv_b_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1MLAAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1MLAAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1MLAAttention.mla_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1MLAAttention.fused_qkv_a_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1MLAAttention.q_a_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1MLAAttention.q_b_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1MLAAttention.kv_a_proj_with_mqa", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1MLAAttention.q_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 40, "n_typed": 19, "n_any": 0, "n_untyped": 21, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 17, "n_attrs": 21, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.AXK1.AXK1MLP", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.AXK1.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.models.AXK1", "names": [ "vllm.model_executor.models.AXK1.AXK1Attention", "vllm.model_executor.models.AXK1.AXK1DecoderLayer", "vllm.model_executor.models.AXK1.AXK1ForCausalLM", "vllm.model_executor.models.AXK1.AXK1MLAAttention", "vllm.model_executor.models.AXK1.AXK1MLP", "vllm.model_executor.models.AXK1.AXK1MixtureOfExperts", "vllm.model_executor.models.AXK1.AXK1MoE", "vllm.model_executor.models.AXK1.AXK1Model", "vllm.model_executor.models.AXK1.get_spec_layer_idx_from_weight_name", "vllm.model_executor.models.AXK1.logger" ], "n_typable": 180, "n_typed": 87, "n_any": 0, "n_untyped": 93, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 21, "n_method_overloads": 21, "n_method_params": 65, "n_classes": 8, "n_attrs": 94, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/interfaces.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.interfaces.SupportsLoRA", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.interfaces.SupportsMultiModal", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.interfaces.SupportsTranscription", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.interfaces.supports_transcription", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 2, "n_params": 1, "n_function_overloads": 2, "n_function_params": 1 }, { "kind": "class", "name": "vllm.model_executor.models.interfaces.SupportsPP", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.interfaces.supports_mrope", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 2, "n_params": 1, "n_function_overloads": 2, "n_function_params": 1 }, { "kind": "class", "name": "vllm.model_executor.models.interfaces.SupportsMRoPE", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.interfaces.supports_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 2, "n_params": 1, "n_function_overloads": 2, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.models.interfaces.supports_lora", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 2, "n_params": 1, "n_function_overloads": 2, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.models.interfaces.has_inner_state", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 2, "n_params": 1, "n_function_overloads": 2, "n_function_params": 1 }, { "kind": "class", "name": "vllm.model_executor.models.interfaces.HasInnerState", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.interfaces.supports_pp", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 2, "n_params": 1, "n_function_overloads": 2, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.model_executor.models.interfaces.WeightsMapper", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.model_executor.models.interfaces.supports_mamba_prefix_caching", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 2, "n_params": 1, "n_function_overloads": 2, "n_function_params": 1 }, { "kind": "class", "name": "vllm.model_executor.models.interfaces.IsAttentionFree", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.interfaces.supports_realtime", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 2, "n_params": 1, "n_function_overloads": 2, "n_function_params": 1 }, { "kind": "class", "name": "vllm.model_executor.models.interfaces.SupportsEagleBase", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.interfaces.supports_multimodal_encoder_tp_data", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.models.interfaces.is_hybrid", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 2, "n_params": 1, "n_function_overloads": 2, "n_function_params": 1 }, { "kind": "class", "name": "vllm.model_executor.models.interfaces.MixtureOfExperts", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.interfaces.supports_xdrope", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 2, "n_params": 1, "n_function_overloads": 2, "n_function_params": 1 }, { "kind": "class", "name": "vllm.model_executor.models.interfaces.SupportsScoreTemplate", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.interfaces.VllmConfig", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.model_executor.models.interfaces.supports_multimodal_raw_input_only", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.model_executor.models.interfaces.IntermediateTensors", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.interfaces.IsHybrid", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.interfaces.supports_multimodal_pruning", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 2, "n_params": 1, "n_function_overloads": 2, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.model_executor.models.interfaces.MultiModalEmbeddings", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.models.interfaces.requires_raw_input_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.models.interfaces.supports_score_template", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 2, "n_params": 1, "n_function_overloads": 2, "n_function_params": 1 }, { "kind": "class", "name": "vllm.model_executor.models.interfaces.HasNoOps", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.interfaces.supports_eagle", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 2, "n_params": 1, "n_function_overloads": 2, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.models.interfaces.supports_cross_encoding", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 2, "n_params": 1, "n_function_overloads": 2, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.models.interfaces.is_attention_free", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 2, "n_params": 1, "n_function_overloads": 2, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.models.interfaces.is_mixture_of_experts", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.model_executor.models.interfaces.SupportsMambaPrefixCaching", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.interfaces.supports_late_interaction", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 2, "n_params": 1, "n_function_overloads": 2, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.models.interfaces.supports_eagle3", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 2, "n_params": 1, "n_function_overloads": 2, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.models.interfaces.has_noops", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 2, "n_params": 1, "n_function_overloads": 2, "n_function_params": 1 }, { "kind": "class", "name": "vllm.model_executor.models.interfaces.SupportsRealtime", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.interfaces.supports_any_eagle", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 2, "n_params": 1, "n_function_overloads": 2, "n_function_params": 1 }, { "kind": "class", "name": "vllm.model_executor.models.interfaces.SupportsCrossEncoding", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.interfaces.MultiModalFeatureSpec", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.interfaces.SupportsXDRoPE", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.interfaces.SupportsMultiModalPruning", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.interfaces.SupportsEagle3", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.interfaces.SupportsEagle", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.interfaces.SupportsQuant", "methods": [ { "kind": "function", "name": "SupportsQuant.__new__", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SupportsQuant._find_quant_config", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SupportsQuant.hf_to_vllm_mapper", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SupportsQuant.packed_modules_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SupportsQuant.quant_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 9, "n_typed": 5, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.interfaces.SupportsLateInteraction", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.interfaces.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.models.interfaces", "names": [ "vllm.model_executor.models.interfaces.HasInnerState", "vllm.model_executor.models.interfaces.HasNoOps", "vllm.model_executor.models.interfaces.IntermediateTensors", "vllm.model_executor.models.interfaces.IsAttentionFree", "vllm.model_executor.models.interfaces.IsHybrid", "vllm.model_executor.models.interfaces.MixtureOfExperts", "vllm.model_executor.models.interfaces.MultiModalEmbeddings", "vllm.model_executor.models.interfaces.MultiModalFeatureSpec", "vllm.model_executor.models.interfaces.SupportsCrossEncoding", "vllm.model_executor.models.interfaces.SupportsEagle", "vllm.model_executor.models.interfaces.SupportsEagle3", "vllm.model_executor.models.interfaces.SupportsEagleBase", "vllm.model_executor.models.interfaces.SupportsLateInteraction", "vllm.model_executor.models.interfaces.SupportsLoRA", "vllm.model_executor.models.interfaces.SupportsMRoPE", "vllm.model_executor.models.interfaces.SupportsMambaPrefixCaching", "vllm.model_executor.models.interfaces.SupportsMultiModal", "vllm.model_executor.models.interfaces.SupportsMultiModalPruning", "vllm.model_executor.models.interfaces.SupportsPP", "vllm.model_executor.models.interfaces.SupportsQuant", "vllm.model_executor.models.interfaces.SupportsRealtime", "vllm.model_executor.models.interfaces.SupportsScoreTemplate", "vllm.model_executor.models.interfaces.SupportsTranscription", "vllm.model_executor.models.interfaces.SupportsXDRoPE", "vllm.model_executor.models.interfaces.VllmConfig", "vllm.model_executor.models.interfaces.WeightsMapper", "vllm.model_executor.models.interfaces.has_inner_state", "vllm.model_executor.models.interfaces.has_noops", "vllm.model_executor.models.interfaces.is_attention_free", "vllm.model_executor.models.interfaces.is_hybrid", "vllm.model_executor.models.interfaces.is_mixture_of_experts", "vllm.model_executor.models.interfaces.logger", "vllm.model_executor.models.interfaces.requires_raw_input_tokens", "vllm.model_executor.models.interfaces.supports_any_eagle", "vllm.model_executor.models.interfaces.supports_cross_encoding", "vllm.model_executor.models.interfaces.supports_eagle", "vllm.model_executor.models.interfaces.supports_eagle3", "vllm.model_executor.models.interfaces.supports_late_interaction", "vllm.model_executor.models.interfaces.supports_lora", "vllm.model_executor.models.interfaces.supports_mamba_prefix_caching", "vllm.model_executor.models.interfaces.supports_mrope", "vllm.model_executor.models.interfaces.supports_multimodal", "vllm.model_executor.models.interfaces.supports_multimodal_encoder_tp_data", "vllm.model_executor.models.interfaces.supports_multimodal_pruning", "vllm.model_executor.models.interfaces.supports_multimodal_raw_input_only", "vllm.model_executor.models.interfaces.supports_pp", "vllm.model_executor.models.interfaces.supports_realtime", "vllm.model_executor.models.interfaces.supports_score_template", "vllm.model_executor.models.interfaces.supports_transcription", "vllm.model_executor.models.interfaces.supports_xdrope" ], "n_typable": 57, "n_typed": 52, "n_any": 0, "n_untyped": 5, "n_functions": 23, "n_function_overloads": 42, "n_function_params": 23, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_classes": 21, "n_attrs": 9, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/interfaces_base.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.models.interfaces_base.is_text_generation_model", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 2, "n_params": 1, "n_function_overloads": 2, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.models.interfaces_base.is_pooling_model", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 2, "n_params": 1, "n_function_overloads": 2, "n_function_params": 1 }, { "kind": "class", "name": "vllm.model_executor.models.interfaces_base.VllmModelForPooling", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.interfaces_base.VllmModelForTextGeneration", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.interfaces_base.get_default_tok_pooling_type", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.models.interfaces_base.is_vllm_model", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 2, "n_params": 1, "n_function_overloads": 2, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.models.interfaces_base.default_pooling_type", "n_typed": 0, "n_any": 2, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.model_executor.models.interfaces_base.T", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.model_executor.models.interfaces_base.get_default_seq_pooling_type", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.models.interfaces_base.get_attn_type", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.model_executor.models.interfaces_base.T_co", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.interfaces_base.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.models.interfaces_base.attn_type", "n_typed": 0, "n_any": 1, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.model_executor.models.interfaces_base.VllmModel", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.interfaces_base", "names": [ "vllm.model_executor.models.interfaces_base.T", "vllm.model_executor.models.interfaces_base.T_co", "vllm.model_executor.models.interfaces_base.VllmModel", "vllm.model_executor.models.interfaces_base.VllmModelForPooling", "vllm.model_executor.models.interfaces_base.VllmModelForTextGeneration", "vllm.model_executor.models.interfaces_base.attn_type", "vllm.model_executor.models.interfaces_base.default_pooling_type", "vllm.model_executor.models.interfaces_base.get_attn_type", "vllm.model_executor.models.interfaces_base.get_default_seq_pooling_type", "vllm.model_executor.models.interfaces_base.get_default_tok_pooling_type", "vllm.model_executor.models.interfaces_base.is_pooling_model", "vllm.model_executor.models.interfaces_base.is_text_generation_model", "vllm.model_executor.models.interfaces_base.is_vllm_model", "vllm.model_executor.models.interfaces_base.logger" ], "n_typable": 18, "n_typed": 9, "n_any": 6, "n_untyped": 3, "n_functions": 8, "n_function_overloads": 11, "n_function_params": 9, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 3, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/adapters.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.models.adapters.SEQ_CLS_LOAD_METHODS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.model_executor.models.adapters.load_weights_using_from_2_way_softmax", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.models.adapters.seq_cls_model_loader", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.models.adapters.SequenceClassificationConfig", "methods": [ { "kind": "function", "name": "SequenceClassificationConfig.verify_and_update_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.adapters.load_weights_no_post_processing", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.models.adapters.as_seq_cls_model", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.models.adapters.as_embedding_model", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.model_executor.models.adapters.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.models.adapters", "names": [ "vllm.model_executor.models.adapters.SEQ_CLS_LOAD_METHODS", "vllm.model_executor.models.adapters.SequenceClassificationConfig", "vllm.model_executor.models.adapters.as_embedding_model", "vllm.model_executor.models.adapters.as_seq_cls_model", "vllm.model_executor.models.adapters.load_weights_no_post_processing", "vllm.model_executor.models.adapters.load_weights_using_from_2_way_softmax", "vllm.model_executor.models.adapters.logger", "vllm.model_executor.models.adapters.seq_cls_model_loader" ], "n_typable": 16, "n_typed": 9, "n_any": 0, "n_untyped": 7, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 8, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_classes": 1, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/afmoe.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.afmoe.AfmoeAttention", "methods": [ { "kind": "function", "name": "AfmoeAttention.__init__", "n_typed": 12, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 }, { "kind": "function", "name": "AfmoeAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AfmoeAttention.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeAttention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeAttention.is_local_attention", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeAttention.sliding_window", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeAttention.gate_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeAttention.q_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeAttention.k_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 36, "n_typed": 15, "n_any": 0, "n_untyped": 21, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 14, "n_attrs": 20, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.afmoe.AfmoeModel", "methods": [ { "kind": "function", "name": "AfmoeModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AfmoeModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AfmoeModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "AfmoeModel.make_empty_intermediate_tensors", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "AfmoeModel.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AfmoeModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AfmoeModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeModel.mup_enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeModel.aux_hidden_state_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 24, "n_typed": 16, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 11, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.afmoe.AfmoeForCausalLM", "methods": [ { "kind": "function", "name": "AfmoeForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AfmoeForCausalLM.set_eplb_state", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "AfmoeForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AfmoeForCausalLM.set_aux_hidden_state_layers", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AfmoeForCausalLM.get_eagle3_aux_hidden_state_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AfmoeForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "AfmoeForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AfmoeForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AfmoeForCausalLM.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AfmoeForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AfmoeForCausalLM.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeForCausalLM.fall_back_to_pt_during_load", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AfmoeForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeForCausalLM.expert_weights", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeForCausalLM.num_moe_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeForCausalLM.num_expert_groups", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeForCausalLM.moe_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeForCausalLM.num_logical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeForCausalLM.num_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeForCausalLM.num_local_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeForCausalLM.num_routed_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeForCausalLM.num_shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeForCausalLM.num_redundant_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 39, "n_typed": 22, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 13, "n_attrs": 19, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.afmoe.AfmoeDecoderLayer", "methods": [ { "kind": "function", "name": "AfmoeDecoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "AfmoeDecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AfmoeDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeDecoderLayer.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeDecoderLayer.moe_enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeDecoderLayer.pre_mlp_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeDecoderLayer.post_mlp_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 9, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.afmoe.AfmoeMoE", "methods": [ { "kind": "function", "name": "AfmoeMoE.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "AfmoeMoE.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AfmoeMoE.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeMoE.route_scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeMoE.score_func", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeMoE.route_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeMoE.ep_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeMoE.ep_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeMoE.ep_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeMoE.n_routed_experts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeMoE.n_shared_experts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeMoE.gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeMoE.expert_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeMoE.enable_eplb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeMoE.n_redundant_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeMoE.n_logical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeMoE.n_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeMoE.n_local_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeMoE.physical_expert_start", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeMoE.physical_expert_end", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeMoE.shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeMoE.experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 27, "n_typed": 7, "n_any": 0, "n_untyped": 20, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 20, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.afmoe.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.models.afmoe", "names": [ "vllm.model_executor.models.afmoe.AfmoeAttention", "vllm.model_executor.models.afmoe.AfmoeDecoderLayer", "vllm.model_executor.models.afmoe.AfmoeForCausalLM", "vllm.model_executor.models.afmoe.AfmoeMoE", "vllm.model_executor.models.afmoe.AfmoeModel", "vllm.model_executor.models.afmoe.logger" ], "n_typable": 146, "n_typed": 69, "n_any": 0, "n_untyped": 77, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 21, "n_method_overloads": 21, "n_method_params": 51, "n_classes": 5, "n_attrs": 76, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/aimv2.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.aimv2.AIMv2Block", "methods": [ { "kind": "function", "name": "AIMv2Block.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "AIMv2Block.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AIMv2Block.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AIMv2Block.norm_1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AIMv2Block.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AIMv2Block.norm_2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 5, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.aimv2.AIMv2PatchEmbed", "methods": [ { "kind": "function", "name": "AIMv2PatchEmbed.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AIMv2PatchEmbed.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AIMv2PatchEmbed.proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AIMv2PatchEmbed.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 6, "n_typed": 3, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.aimv2.AIMv2Transformer", "methods": [ { "kind": "function", "name": "AIMv2Transformer.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "AIMv2Transformer.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AIMv2Transformer.blocks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AIMv2Transformer.post_trunk_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 6, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.aimv2.AIMv2Model", "methods": [ { "kind": "function", "name": "AIMv2Model.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "AIMv2Model.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AIMv2Model.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AIMv2Model.preprocessor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AIMv2Model.trunk", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 8, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.aimv2.AIMv2ViTPreprocessor", "methods": [ { "kind": "function", "name": "AIMv2ViTPreprocessor.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AIMv2ViTPreprocessor.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AIMv2ViTPreprocessor.patchifier", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AIMv2ViTPreprocessor.pos_embed", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 6, "n_typed": 3, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.aimv2.AIMv2SwiGLUFFN", "methods": [ { "kind": "function", "name": "AIMv2SwiGLUFFN.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "AIMv2SwiGLUFFN.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AIMv2SwiGLUFFN.fc13", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AIMv2SwiGLUFFN.fc2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AIMv2SwiGLUFFN.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 5, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.aimv2.AIMv2Attention", "methods": [ { "kind": "function", "name": "AIMv2Attention.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "AIMv2Attention.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AIMv2Attention.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AIMv2Attention.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AIMv2Attention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AIMv2Attention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AIMv2Attention.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AIMv2Attention.qkv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AIMv2Attention.proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AIMv2Attention.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AIMv2Attention.num_heads_per_partition", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AIMv2Attention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 5, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 10, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.aimv2", "names": [ "vllm.model_executor.models.aimv2.AIMv2Attention", "vllm.model_executor.models.aimv2.AIMv2Block", "vllm.model_executor.models.aimv2.AIMv2Model", "vllm.model_executor.models.aimv2.AIMv2PatchEmbed", "vllm.model_executor.models.aimv2.AIMv2SwiGLUFFN", "vllm.model_executor.models.aimv2.AIMv2Transformer", "vllm.model_executor.models.aimv2.AIMv2ViTPreprocessor" ], "n_typable": 67, "n_typed": 35, "n_any": 0, "n_untyped": 32, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 27, "n_classes": 7, "n_attrs": 25, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/apertus.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.apertus.ApertusModel", "methods": [ { "kind": "function", "name": "ApertusModel.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ApertusModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ApertusModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ApertusModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ApertusModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ApertusModel.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ApertusModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ApertusModel.aux_hidden_state_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ApertusModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ApertusModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ApertusModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 12, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 9, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.apertus.ApertusForCausalLM", "methods": [ { "kind": "function", "name": "ApertusForCausalLM.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ApertusForCausalLM.set_aux_hidden_state_layers", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ApertusForCausalLM.get_eagle3_aux_hidden_state_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ApertusForCausalLM._init_model", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ApertusForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ApertusForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ApertusForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ApertusForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ApertusForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ApertusForCausalLM.embedding_modules", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ApertusForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ApertusForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ApertusForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ApertusForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ApertusForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 27, "n_typed": 20, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 14, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.apertus.ApertusAttention", "methods": [ { "kind": "function", "name": "ApertusAttention.__init__", "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "ApertusAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ApertusAttention._init_rotary_emb", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ApertusAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ApertusAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ApertusAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ApertusAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ApertusAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ApertusAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ApertusAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ApertusAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ApertusAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ApertusAttention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ApertusAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ApertusAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ApertusAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ApertusAttention.q_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ApertusAttention.k_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 33, "n_typed": 18, "n_any": 0, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 15, "n_attrs": 15, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.apertus.ApertusMLP", "methods": [ { "kind": "function", "name": "ApertusMLP.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "ApertusMLP.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ApertusMLP.up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ApertusMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ApertusMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 8, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.apertus.ApertusDecoderLayer", "methods": [ { "kind": "function", "name": "ApertusDecoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ApertusDecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ApertusDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ApertusDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ApertusDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ApertusDecoderLayer.attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ApertusDecoderLayer.feedforward_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 9, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 5, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.apertus", "names": [ "vllm.model_executor.models.apertus.ApertusAttention", "vllm.model_executor.models.apertus.ApertusDecoderLayer", "vllm.model_executor.models.apertus.ApertusForCausalLM", "vllm.model_executor.models.apertus.ApertusMLP", "vllm.model_executor.models.apertus.ApertusModel" ], "n_typable": 107, "n_typed": 67, "n_any": 0, "n_untyped": 40, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 19, "n_method_overloads": 19, "n_method_params": 53, "n_classes": 5, "n_attrs": 37, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/arcee.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.arcee.ArceeModel", "methods": [ { "kind": "function", "name": "ArceeModel.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ArceeModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ArceeModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ArceeModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ArceeModel.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArceeModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArceeModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArceeModel.aux_hidden_state_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ArceeModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArceeModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArceeModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 13, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 9, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.arcee.ArceeDecoderLayer", "methods": [ { "kind": "function", "name": "ArceeDecoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ArceeDecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ArceeDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArceeDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArceeDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArceeDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArceeDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 9, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.arcee.ArceeMLP", "methods": [ { "kind": "function", "name": "ArceeMLP.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "ArceeMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ArceeMLP.up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArceeMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArceeMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 10, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.arcee.ArceeForCausalLM", "methods": [ { "kind": "function", "name": "ArceeForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ArceeForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ArceeForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ArceeForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ArceeForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ArceeForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ArceeForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArceeForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArceeForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArceeForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArceeForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 13, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.arcee", "names": [ "vllm.model_executor.models.arcee.ArceeDecoderLayer", "vllm.model_executor.models.arcee.ArceeForCausalLM", "vllm.model_executor.models.arcee.ArceeMLP", "vllm.model_executor.models.arcee.ArceeModel" ], "n_typable": 66, "n_typed": 45, "n_any": 0, "n_untyped": 21, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 33, "n_classes": 4, "n_attrs": 21, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/arctic.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.models.arctic.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.arctic.ArcticMoE", "methods": [ { "kind": "function", "name": "ArcticMoE.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "ArcticMoE.weight_loader", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ArcticMoE.local_moe_fused", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ArcticMoE.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ArcticMoE.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticMoE.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticMoE.num_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticMoE.layer_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticMoE.top_k", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticMoE.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticMoE.is_moe_layer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticMoE.reduce_results", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticMoE.params_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticMoE.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticMoE.gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticMoE.ws", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticMoE.w2s", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 29, "n_typed": 13, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 12, "n_attrs": 13, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.arctic.ArcticAttention", "methods": [ { "kind": "function", "name": "ArcticAttention.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ArcticAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ArcticAttention.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticAttention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 23, "n_typed": 7, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 15, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.arctic.ArcticForCausalLM", "methods": [ { "kind": "function", "name": "ArcticForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ArcticForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ArcticForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ArcticForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ArcticForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ArcticForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ArcticForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticForCausalLM.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticForCausalLM.num_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticForCausalLM.num_experts_per_tok", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 13, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.arctic.ArcticDecoderLayer", "methods": [ { "kind": "function", "name": "ArcticDecoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ArcticDecoderLayer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ArcticDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticDecoderLayer.use_residual", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticDecoderLayer.block_sparse_moe", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticDecoderLayer.residual_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticDecoderLayer.residual_mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 8, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.arctic.ArcticModel", "methods": [ { "kind": "function", "name": "ArcticModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ArcticModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ArcticModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ArcticModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 9, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.arctic.ArcticMLP", "methods": [ { "kind": "function", "name": "ArcticMLP.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "ArcticMLP.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ArcticMLP.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticMLP.expert_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticMLP.ffn_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticMLP.w13", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticMLP.w2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 6, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.arctic", "names": [ "vllm.model_executor.models.arctic.ArcticAttention", "vllm.model_executor.models.arctic.ArcticDecoderLayer", "vllm.model_executor.models.arctic.ArcticForCausalLM", "vllm.model_executor.models.arctic.ArcticMLP", "vllm.model_executor.models.arctic.ArcticMoE", "vllm.model_executor.models.arctic.ArcticModel", "vllm.model_executor.models.arctic.logger" ], "n_typable": 120, "n_typed": 56, "n_any": 0, "n_untyped": 64, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 18, "n_method_overloads": 18, "n_method_params": 47, "n_classes": 6, "n_attrs": 56, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/aria.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.aria.AriaProjectorMLP", "methods": [ { "kind": "function", "name": "AriaProjectorMLP.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "AriaProjectorMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AriaProjectorMLP.linear_in", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AriaProjectorMLP.linear_out", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AriaProjectorMLP.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 7, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.aria.AriaFusedMoE", "methods": [ { "kind": "function", "name": "AriaFusedMoE.weight_loader", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.aria.AriaImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "AriaImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AriaImagePixelInputs.pixel_values", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AriaImagePixelInputs.pixel_mask", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.aria.AriaVisionTransformer", "methods": [ { "kind": "function", "name": "AriaVisionTransformer.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "AriaVisionTransformer.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AriaVisionTransformer.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AriaVisionTransformer.post_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.aria.AriaTextModel", "methods": [ { "kind": "function", "name": "AriaTextModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AriaTextModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AriaTextModel.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 5, "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.aria.AriaProjector", "methods": [ { "kind": "function", "name": "AriaProjector.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AriaProjector.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AriaProjector.patch_to_query_dict", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AriaProjector.in_features", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AriaProjector.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AriaProjector.kv_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AriaProjector.hidden_features", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AriaProjector.output_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AriaProjector.query", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AriaProjector.cross_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AriaProjector.layer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AriaProjector.feed_forward", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 6, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 10, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.aria.AriaTextMoELayer", "methods": [ { "kind": "function", "name": "AriaTextMoELayer.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "AriaTextMoELayer.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AriaTextMoELayer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AriaTextMoELayer.router_weight", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AriaTextMoELayer.shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AriaTextMoELayer.experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 6, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.aria.AriaDummyInputsBuilder", "methods": [ { "kind": "function", "name": "AriaDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AriaDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.aria.AriaMultiModalProcessor", "methods": [ { "kind": "function", "name": "AriaMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AriaMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.aria.AriaForConditionalGeneration", "methods": [ { "kind": "function", "name": "AriaForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AriaForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AriaForConditionalGeneration._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AriaForConditionalGeneration._create_patch_attention_mask", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AriaForConditionalGeneration._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AriaForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AriaForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "AriaForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AriaForConditionalGeneration.load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AriaForConditionalGeneration.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AriaForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AriaForConditionalGeneration.vision_tower", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AriaForConditionalGeneration.multi_modal_projector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AriaForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AriaForConditionalGeneration.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AriaForConditionalGeneration.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 31, "n_typed": 22, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 15, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.aria.AriaProcessingInfo", "methods": [ { "kind": "function", "name": "AriaProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AriaProcessingInfo.get_vision_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AriaProcessingInfo.get_hf_processor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AriaProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AriaProcessingInfo.get_num_image_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 3, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.aria.AriaTextDecoderLayer", "methods": [ { "kind": "function", "name": "AriaTextDecoderLayer.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AriaTextDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 4, "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.aria", "names": [ "vllm.model_executor.models.aria.AriaDummyInputsBuilder", "vllm.model_executor.models.aria.AriaForConditionalGeneration", "vllm.model_executor.models.aria.AriaFusedMoE", "vllm.model_executor.models.aria.AriaImagePixelInputs", "vllm.model_executor.models.aria.AriaMultiModalProcessor", "vllm.model_executor.models.aria.AriaProcessingInfo", "vllm.model_executor.models.aria.AriaProjector", "vllm.model_executor.models.aria.AriaProjectorMLP", "vllm.model_executor.models.aria.AriaTextDecoderLayer", "vllm.model_executor.models.aria.AriaTextMoELayer", "vllm.model_executor.models.aria.AriaTextModel", "vllm.model_executor.models.aria.AriaVisionTransformer" ], "n_typable": 109, "n_typed": 77, "n_any": 0, "n_untyped": 32, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 30, "n_method_overloads": 30, "n_method_params": 50, "n_classes": 12, "n_attrs": 31, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/audioflamingo3.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.models.audioflamingo3.MAX_AUDIO_LEN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.audioflamingo3.AudioFlamingo3MultiModalDataParser", "methods": [ { "kind": "function", "name": "AudioFlamingo3MultiModalDataParser._parse_audio_data", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.audioflamingo3.AudioFlamingo3MultiModalProjector", "methods": [ { "kind": "function", "name": "AudioFlamingo3MultiModalProjector.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AudioFlamingo3MultiModalProjector.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AudioFlamingo3MultiModalProjector.linear_1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AudioFlamingo3MultiModalProjector.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AudioFlamingo3MultiModalProjector.linear_2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 1, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.audioflamingo3.AudioFlamingo3ForConditionalGeneration", "methods": [ { "kind": "function", "name": "AudioFlamingo3ForConditionalGeneration.get_mm_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AudioFlamingo3ForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AudioFlamingo3ForConditionalGeneration._parse_and_validate_audio_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AudioFlamingo3ForConditionalGeneration._process_audio_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AudioFlamingo3ForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AudioFlamingo3ForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "AudioFlamingo3ForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AudioFlamingo3ForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AudioFlamingo3ForConditionalGeneration.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AudioFlamingo3ForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AudioFlamingo3ForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AudioFlamingo3ForConditionalGeneration.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AudioFlamingo3ForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AudioFlamingo3ForConditionalGeneration.audio_tower", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AudioFlamingo3ForConditionalGeneration.multi_modal_projector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AudioFlamingo3ForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 27, "n_typed": 19, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 12, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.audioflamingo3.AudioFlamingo3FeatureInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "AudioFlamingo3FeatureInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AudioFlamingo3FeatureInputs.input_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AudioFlamingo3FeatureInputs.feature_attention_mask", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AudioFlamingo3FeatureInputs.chunk_counts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.audioflamingo3.AudioFlamingo3Encoder", "methods": [ { "kind": "function", "name": "AudioFlamingo3Encoder.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AudioFlamingo3Encoder.forward", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AudioFlamingo3Encoder._get_feat_extract_output_lengths", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AudioFlamingo3Encoder.avg_pooler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AudioFlamingo3Encoder.pos_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 4, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.audioflamingo3.AudioFlamingo3DummyInputsBuilder", "methods": [ { "kind": "function", "name": "AudioFlamingo3DummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AudioFlamingo3DummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.audioflamingo3.AudioFlamingo3Inputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.audioflamingo3.AudioFlamingo3ProcessingInfo", "methods": [ { "kind": "function", "name": "AudioFlamingo3ProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AudioFlamingo3ProcessingInfo.get_hf_processor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AudioFlamingo3ProcessingInfo.get_feature_extractor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AudioFlamingo3ProcessingInfo.get_data_parser", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AudioFlamingo3ProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 3, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.audioflamingo3.AudioFlamingo3EmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "AudioFlamingo3EmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AudioFlamingo3EmbeddingInputs.audio_embeds", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.audioflamingo3.AudioFlamingo3MultiModalProcessor", "methods": [ { "kind": "function", "name": "AudioFlamingo3MultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "AudioFlamingo3MultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AudioFlamingo3MultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.audioflamingo3", "names": [ "vllm.model_executor.models.audioflamingo3.AudioFlamingo3DummyInputsBuilder", "vllm.model_executor.models.audioflamingo3.AudioFlamingo3EmbeddingInputs", "vllm.model_executor.models.audioflamingo3.AudioFlamingo3Encoder", "vllm.model_executor.models.audioflamingo3.AudioFlamingo3FeatureInputs", "vllm.model_executor.models.audioflamingo3.AudioFlamingo3ForConditionalGeneration", "vllm.model_executor.models.audioflamingo3.AudioFlamingo3Inputs", "vllm.model_executor.models.audioflamingo3.AudioFlamingo3MultiModalDataParser", "vllm.model_executor.models.audioflamingo3.AudioFlamingo3MultiModalProcessor", "vllm.model_executor.models.audioflamingo3.AudioFlamingo3MultiModalProjector", "vllm.model_executor.models.audioflamingo3.AudioFlamingo3ProcessingInfo", "vllm.model_executor.models.audioflamingo3.MAX_AUDIO_LEN" ], "n_typable": 77, "n_typed": 54, "n_any": 0, "n_untyped": 23, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 24, "n_method_overloads": 24, "n_method_params": 34, "n_classes": 9, "n_attrs": 21, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/aya_vision.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.aya_vision.AyaVisionProcessingInfo", "methods": [ { "kind": "function", "name": "AyaVisionProcessingInfo.get_hf_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AyaVisionProcessingInfo.get_hf_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AyaVisionProcessingInfo.get_image_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AyaVisionProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AyaVisionProcessingInfo.get_image_size_with_most_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AyaVisionProcessingInfo.get_num_patches", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [], "n_typable": 13, "n_typed": 13, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 7, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.aya_vision.AyaVisionMultiModalProcessor", "methods": [ { "kind": "function", "name": "AyaVisionMultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "AyaVisionMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AyaVisionMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.aya_vision.AyaVisionMultiModalProjector", "methods": [ { "kind": "function", "name": "AyaVisionMultiModalProjector.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AyaVisionMultiModalProjector.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AyaVisionMultiModalProjector.pixel_shuffle", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AyaVisionMultiModalProjector.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AyaVisionMultiModalProjector.downsample_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AyaVisionMultiModalProjector.alignment_intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AyaVisionMultiModalProjector.layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AyaVisionMultiModalProjector.linear_1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AyaVisionMultiModalProjector.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AyaVisionMultiModalProjector.linear_2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 5, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.aya_vision.AyaVisionForConditionalGeneration", "methods": [ { "kind": "function", "name": "AyaVisionForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AyaVisionForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AyaVisionForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AyaVisionForConditionalGeneration._image_pixels_to_features", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AyaVisionForConditionalGeneration._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AyaVisionForConditionalGeneration._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AyaVisionForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AyaVisionForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "AyaVisionForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "AyaVisionForConditionalGeneration.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "AyaVisionForConditionalGeneration.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AyaVisionForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AyaVisionForConditionalGeneration.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AyaVisionForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AyaVisionForConditionalGeneration.vision_tower", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AyaVisionForConditionalGeneration.multi_modal_projector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AyaVisionForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 34, "n_typed": 24, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 17, "n_attrs": 7, "n_properties": 1 }, { "kind": "class", "name": "vllm.model_executor.models.aya_vision.AyaVisionImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "AyaVisionImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AyaVisionImagePixelInputs.pixel_values", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AyaVisionImagePixelInputs.num_patches", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.aya_vision.AyaVisionDummyInputsBuilder", "methods": [ { "kind": "function", "name": "AyaVisionDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AyaVisionDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.aya_vision", "names": [ "vllm.model_executor.models.aya_vision.AyaVisionDummyInputsBuilder", "vllm.model_executor.models.aya_vision.AyaVisionForConditionalGeneration", "vllm.model_executor.models.aya_vision.AyaVisionImagePixelInputs", "vllm.model_executor.models.aya_vision.AyaVisionMultiModalProcessor", "vllm.model_executor.models.aya_vision.AyaVisionMultiModalProjector", "vllm.model_executor.models.aya_vision.AyaVisionProcessingInfo" ], "n_typable": 81, "n_typed": 63, "n_any": 0, "n_untyped": 18, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 23, "n_method_overloads": 23, "n_method_params": 40, "n_classes": 6, "n_attrs": 17, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/bagel.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.bagel.BagelForConditionalGeneration", "methods": [ { "kind": "function", "name": "BagelForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BagelForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BagelForConditionalGeneration._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BagelForConditionalGeneration._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BagelForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BagelForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "BagelForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BagelForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BagelForConditionalGeneration.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BagelForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BagelForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BagelForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BagelForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BagelForConditionalGeneration.vit_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BagelForConditionalGeneration.connector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BagelForConditionalGeneration.vit_pos_embed", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 30, "n_typed": 21, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 14, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bagel.BagelDummyInputsBuilder", "methods": [ { "kind": "function", "name": "BagelDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BagelDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bagel.BagelProcessingInfo", "methods": [ { "kind": "function", "name": "BagelProcessingInfo.get_hf_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BagelProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BagelProcessingInfo.get_mm_max_tokens_per_item", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BagelProcessingInfo.get_num_image_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.bagel.BagelImageInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.bagel.BagelImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "BagelImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BagelImagePixelInputs.pixel_values", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bagel.BagelMultiModalProcessor", "methods": [ { "kind": "function", "name": "BagelMultiModalProcessor._hf_processor_applies_updates", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BagelMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BagelMultiModalProcessor._get_mm_fields_config", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 11, "n_any": 1, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bagel.BagelVisionMLP", "methods": [ { "kind": "function", "name": "BagelVisionMLP.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "BagelVisionMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BagelVisionMLP.fc1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BagelVisionMLP.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BagelVisionMLP.fc2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 8, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.bagel.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.bagel.PositionEmbedding", "methods": [ { "kind": "function", "name": "PositionEmbedding.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PositionEmbedding._get_2d_sincos_pos_embed", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PositionEmbedding._get_2d_sincos_pos_embed_from_grid", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PositionEmbedding._get_1d_sincos_pos_embed_from_grid", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PositionEmbedding.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PositionEmbedding.max_num_patch_per_side", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PositionEmbedding.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 8, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.bagel", "names": [ "vllm.model_executor.models.bagel.BagelDummyInputsBuilder", "vllm.model_executor.models.bagel.BagelForConditionalGeneration", "vllm.model_executor.models.bagel.BagelImageInputs", "vllm.model_executor.models.bagel.BagelImagePixelInputs", "vllm.model_executor.models.bagel.BagelMultiModalProcessor", "vllm.model_executor.models.bagel.BagelProcessingInfo", "vllm.model_executor.models.bagel.BagelVisionMLP", "vllm.model_executor.models.bagel.PositionEmbedding", "vllm.model_executor.models.bagel.logger" ], "n_typable": 89, "n_typed": 66, "n_any": 1, "n_untyped": 22, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 24, "n_method_overloads": 24, "n_method_params": 48, "n_classes": 7, "n_attrs": 17, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/baichuan.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.baichuan.BaiChuanBaseForCausalLM", "methods": [ { "kind": "function", "name": "BaiChuanBaseForCausalLM.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BaiChuanBaseForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaiChuanBaseForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BaiChuanBaseForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaiChuanBaseForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaiChuanBaseForCausalLM.lm_head_weight_loader", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BaiChuanBaseForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BaiChuanBaseForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaiChuanBaseForCausalLM.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaiChuanBaseForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaiChuanBaseForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaiChuanBaseForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaiChuanBaseForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaiChuanBaseForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 25, "n_typed": 16, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 12, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.baichuan.BaiChuanDecoderLayer", "methods": [ { "kind": "function", "name": "BaiChuanDecoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "BaiChuanDecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BaiChuanDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaiChuanDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaiChuanDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaiChuanDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaiChuanDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 9, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.baichuan.BaiChuanMLP", "methods": [ { "kind": "function", "name": "BaiChuanMLP.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "BaiChuanMLP.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BaiChuanMLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaiChuanMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaiChuanMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 5, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.baichuan.BaiChuanAttention", "methods": [ { "kind": "function", "name": "BaiChuanAttention.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "BaiChuanAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BaiChuanAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaiChuanAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaiChuanAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaiChuanAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaiChuanAttention.position_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaiChuanAttention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaiChuanAttention.W_pack", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaiChuanAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaiChuanAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaiChuanAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaiChuanAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 23, "n_typed": 11, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 10, "n_attrs": 11, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.baichuan.BaiChuanForCausalLM", "methods": [ { "kind": "function", "name": "BaiChuanForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.baichuan.BaichuanForCausalLM", "methods": [ { "kind": "function", "name": "BaichuanForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.baichuan.BaiChuanModel", "methods": [ { "kind": "function", "name": "BaiChuanModel.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BaiChuanModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaiChuanModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BaiChuanModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BaiChuanModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaiChuanModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaiChuanModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaiChuanModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaiChuanModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 13, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 9, "n_attrs": 5, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.baichuan", "names": [ "vllm.model_executor.models.baichuan.BaiChuanAttention", "vllm.model_executor.models.baichuan.BaiChuanBaseForCausalLM", "vllm.model_executor.models.baichuan.BaiChuanDecoderLayer", "vllm.model_executor.models.baichuan.BaiChuanForCausalLM", "vllm.model_executor.models.baichuan.BaiChuanMLP", "vllm.model_executor.models.baichuan.BaiChuanModel", "vllm.model_executor.models.baichuan.BaichuanForCausalLM" ], "n_typable": 98, "n_typed": 58, "n_any": 0, "n_untyped": 40, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 18, "n_method_overloads": 18, "n_method_params": 49, "n_classes": 7, "n_attrs": 32, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/bailing_moe.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.bailing_moe.BailingMoeBlock", "methods": [ { "kind": "function", "name": "BailingMoeBlock.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BailingMoeBlock.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BailingMoeBlock.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeBlock.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeBlock.attention", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeBlock.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeBlock.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 8, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bailing_moe.BailingMLP", "methods": [ { "kind": "function", "name": "BailingMLP.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "BailingMLP.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BailingMLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 6, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bailing_moe.BailingMoeModel", "methods": [ { "kind": "function", "name": "BailingMoeModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BailingMoeModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BailingMoeModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BailingMoeModel.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BailingMoeModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BailingMoeModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeModel.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeModel.tie_word_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeModel.embedding_dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeModel.word_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 12, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 8, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bailing_moe.BailingMoeV2ForCausalLM", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bailing_moe.BailingAttention", "methods": [ { "kind": "function", "name": "BailingAttention.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "BailingAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BailingAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingAttention.total_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingAttention.q_size_per_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingAttention.kv_size_per_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingAttention.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingAttention.use_qk_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingAttention.use_rmsnorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingAttention.query_key_value", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingAttention.dense", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingAttention.query_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingAttention.key_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 26, "n_typed": 8, "n_any": 0, "n_untyped": 18, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 17, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bailing_moe.BailingMoeForCausalLM", "methods": [ { "kind": "function", "name": "BailingMoeForCausalLM.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BailingMoeForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BailingMoeForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BailingMoeForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BailingMoeForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BailingMoeForCausalLM.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BailingMoeForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BailingMoeForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeForCausalLM.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeForCausalLM.tie_word_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 23, "n_typed": 15, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 9, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bailing_moe.BailingMoE", "methods": [ { "kind": "function", "name": "BailingMoE.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "BailingMoE.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BailingMoE.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoE.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoE.num_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoE.top_k", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoE.norm_expert_prob", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoE.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoE.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoE.num_shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoE.score_function", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoE.n_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoE.topk_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoE.use_grouped_topk", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoE.routed_scaling_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoE.gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoE.correction_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoE.experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoE.router_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoE.shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 26, "n_typed": 7, "n_any": 0, "n_untyped": 19, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 18, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.bailing_moe", "names": [ "vllm.model_executor.models.bailing_moe.BailingAttention", "vllm.model_executor.models.bailing_moe.BailingMLP", "vllm.model_executor.models.bailing_moe.BailingMoE", "vllm.model_executor.models.bailing_moe.BailingMoeBlock", "vllm.model_executor.models.bailing_moe.BailingMoeForCausalLM", "vllm.model_executor.models.bailing_moe.BailingMoeModel", "vllm.model_executor.models.bailing_moe.BailingMoeV2ForCausalLM" ], "n_typable": 121, "n_typed": 56, "n_any": 0, "n_untyped": 65, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 19, "n_method_overloads": 19, "n_method_params": 43, "n_classes": 7, "n_attrs": 60, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/bailing_moe_linear.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.bailing_moe_linear.BailingMoeV25", "methods": [ { "kind": "function", "name": "BailingMoeV25.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BailingMoeV25.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BailingMoeV25.layer_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25.num_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25.top_k", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25.norm_expert_prob", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25.num_shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25.score_function", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25.n_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25.topk_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25.use_grouped_topk", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25.routed_scaling_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25.gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25.experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25.router_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25.shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 25, "n_typed": 6, "n_any": 0, "n_untyped": 19, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 18, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bailing_moe_linear.BailingMoeV25MLAAttention", "methods": [ { "kind": "function", "name": "BailingMoeV25MLAAttention.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "BailingMoeV25MLAAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BailingMoeV25MLAAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25MLAAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25MLAAttention.layer_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25MLAAttention.prefix", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25MLAAttention.qk_nope_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25MLAAttention.qk_rope_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25MLAAttention.qk_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25MLAAttention.v_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25MLAAttention.q_lora_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25MLAAttention.kv_lora_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25MLAAttention.num_local_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25MLAAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25MLAAttention.kv_a_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25MLAAttention.kv_b_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25MLAAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25MLAAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25MLAAttention.mla_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25MLAAttention.fused_qkv_a_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25MLAAttention.q_a_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25MLAAttention.q_b_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25MLAAttention.q_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25MLAAttention.kv_a_proj_with_mqa", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 31, "n_typed": 9, "n_any": 0, "n_untyped": 22, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 22, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bailing_moe_linear.BailingMoeV25ForCausalLM", "methods": [ { "kind": "function", "name": "BailingMoeV25ForCausalLM.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BailingMoeV25ForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BailingMoeV25ForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BailingMoeV25ForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BailingMoeV25ForCausalLM.make_empty_intermediate_tensors", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BailingMoeV25ForCausalLM.get_mamba_state_shape_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BailingMoeV25ForCausalLM.get_mamba_state_dtype_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BailingMoeV25ForCausalLM.get_mamba_state_copy_func", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BailingMoeV25ForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BailingMoeV25ForCausalLM.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BailingMoeV25ForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BailingMoeV25ForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25ForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25ForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25ForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25ForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 29, "n_typed": 24, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 14, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bailing_moe_linear.BailingMoeV25DecoderLayer", "methods": [ { "kind": "function", "name": "BailingMoeV25DecoderLayer.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "BailingMoeV25DecoderLayer.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BailingMoeV25DecoderLayer.layer_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25DecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25DecoderLayer.attention_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25DecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25DecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25DecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25DecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 12, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 10, "n_attrs": 7, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.bailing_moe_linear.is_linear_layer", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.models.bailing_moe_linear.BailingMoeV25Model", "methods": [ { "kind": "function", "name": "BailingMoeV25Model.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BailingMoeV25Model.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BailingMoeV25Model.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BailingMoeV25Model.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BailingMoeV25Model.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BailingMoeV25Model.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25Model.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25Model.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25Model.layer_group_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25Model.num_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25Model.decoder_attention_types", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25Model.word_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoeV25Model.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 12, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 8, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bailing_moe_linear.BailingMoEGate", "methods": [ { "kind": "function", "name": "BailingMoEGate.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BailingMoEGate.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BailingMoEGate.params_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoEGate.weight", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoEGate.expert_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 3, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bailing_moe_linear.BailingGroupRMSNormGate", "methods": [ { "kind": "function", "name": "BailingGroupRMSNormGate.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 7, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "BailingGroupRMSNormGate._weight_loader", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 10, "n_typed": 3, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.bailing_moe_linear.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.bailing_moe_linear.BailingMoELinearAttention", "methods": [ { "kind": "function", "name": "BailingMoELinearAttention.get_state_shape", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BailingMoELinearAttention.get_state_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BailingMoELinearAttention.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "BailingMoELinearAttention.weight_direct_load", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BailingMoELinearAttention.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BailingMoELinearAttention._forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BailingMoELinearAttention._prefill_and_mix_infer", "n_typed": 0, "n_any": 0, "n_untyped": 7, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "BailingMoELinearAttention._decode_infer", "n_typed": 0, "n_any": 0, "n_untyped": 7, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [ { "kind": "property", "name": "BailingMoELinearAttention.mamba_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "BailingMoELinearAttention.layer_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoELinearAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoELinearAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoELinearAttention.total_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoELinearAttention.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoELinearAttention.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoELinearAttention.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoELinearAttention.cache_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoELinearAttention.prefix", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoELinearAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoELinearAttention.hidden_inner_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoELinearAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoELinearAttention.tp_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoELinearAttention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoELinearAttention.rope_theta", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoELinearAttention.tp_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoELinearAttention.q_size_per_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoELinearAttention.kv_size_per_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoELinearAttention.use_qk_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoELinearAttention.linear_backend", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoELinearAttention.linear_scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoELinearAttention.linear_rope", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoELinearAttention.BLOCK", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoELinearAttention.query_key_value", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoELinearAttention.g_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoELinearAttention.dense", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoELinearAttention.group_norm_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoELinearAttention.rms_norm_eps", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoELinearAttention.g_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoELinearAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoELinearAttention.tp_slope", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoELinearAttention.linear_silu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoELinearAttention.query_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoELinearAttention.key_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BailingMoELinearAttention.slope_rate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 70, "n_typed": 20, "n_any": 0, "n_untyped": 50, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 26, "n_attrs": 35, "n_properties": 1 } ], "type_ignores": [], "name": "vllm.model_executor.models.bailing_moe_linear", "names": [ "vllm.model_executor.models.bailing_moe_linear.BailingGroupRMSNormGate", "vllm.model_executor.models.bailing_moe_linear.BailingMoEGate", "vllm.model_executor.models.bailing_moe_linear.BailingMoELinearAttention", "vllm.model_executor.models.bailing_moe_linear.BailingMoeV25", "vllm.model_executor.models.bailing_moe_linear.BailingMoeV25DecoderLayer", "vllm.model_executor.models.bailing_moe_linear.BailingMoeV25ForCausalLM", "vllm.model_executor.models.bailing_moe_linear.BailingMoeV25MLAAttention", "vllm.model_executor.models.bailing_moe_linear.BailingMoeV25Model", "vllm.model_executor.models.bailing_moe_linear.is_linear_layer", "vllm.model_executor.models.bailing_moe_linear.logger" ], "n_typable": 218, "n_typed": 89, "n_any": 0, "n_untyped": 129, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 33, "n_method_overloads": 33, "n_method_params": 82, "n_classes": 8, "n_attrs": 100, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/bamba.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.bamba.BambaMixerDecoderLayer", "methods": [ { "kind": "function", "name": "BambaMixerDecoderLayer.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "BambaMixerDecoderLayer.forward", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BambaMixerDecoderLayer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BambaMixerDecoderLayer.mamba", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BambaMixerDecoderLayer.feed_forward", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BambaMixerDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BambaMixerDecoderLayer.pre_ff_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 9, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 9, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bamba.BambaMLP", "methods": [ { "kind": "function", "name": "BambaMLP.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BambaMLP.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BambaMLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BambaMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BambaMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 5, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bamba.BambaAttentionDecoderLayer", "methods": [ { "kind": "function", "name": "BambaAttentionDecoderLayer.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "BambaAttentionDecoderLayer.self_attention", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BambaAttentionDecoderLayer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BambaAttentionDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BambaAttentionDecoderLayer.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BambaAttentionDecoderLayer.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BambaAttentionDecoderLayer.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BambaAttentionDecoderLayer.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BambaAttentionDecoderLayer.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BambaAttentionDecoderLayer.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BambaAttentionDecoderLayer.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BambaAttentionDecoderLayer.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BambaAttentionDecoderLayer.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BambaAttentionDecoderLayer.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BambaAttentionDecoderLayer.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BambaAttentionDecoderLayer.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BambaAttentionDecoderLayer.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BambaAttentionDecoderLayer.feed_forward", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BambaAttentionDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BambaAttentionDecoderLayer.pre_ff_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 33, "n_typed": 13, "n_any": 0, "n_untyped": 20, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 13, "n_attrs": 17, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.bamba.ALL_DECODER_LAYER_TYPES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bamba.BambaForCausalLM", "methods": [ { "kind": "function", "name": "BambaForCausalLM.get_mamba_state_dtype_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BambaForCausalLM.get_mamba_state_shape_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BambaForCausalLM.get_mamba_state_copy_func", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BambaForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BambaForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BambaForCausalLM.forward", "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "BambaForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BambaForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BambaForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BambaForCausalLM.embedding_modules", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BambaForCausalLM.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BambaForCausalLM.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BambaForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BambaForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BambaForCausalLM.scheduler_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BambaForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BambaForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BambaForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BambaForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 29, "n_typed": 17, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 12, "n_attrs": 11, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bamba.BambaModel", "methods": [ { "kind": "function", "name": "BambaModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BambaModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BambaModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BambaModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BambaModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BambaModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BambaModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BambaModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BambaModel.final_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 11, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 5, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.bamba", "names": [ "vllm.model_executor.models.bamba.ALL_DECODER_LAYER_TYPES", "vllm.model_executor.models.bamba.BambaAttentionDecoderLayer", "vllm.model_executor.models.bamba.BambaForCausalLM", "vllm.model_executor.models.bamba.BambaMLP", "vllm.model_executor.models.bamba.BambaMixerDecoderLayer", "vllm.model_executor.models.bamba.BambaModel" ], "n_typable": 105, "n_typed": 55, "n_any": 0, "n_untyped": 50, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 19, "n_method_overloads": 19, "n_method_params": 47, "n_classes": 5, "n_attrs": 42, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/bee.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.bee.BeeDummyInputsBuilder", "methods": [ { "kind": "function", "name": "BeeDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BeeDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bee.BeeMultiModalProjector", "methods": [ { "kind": "function", "name": "BeeMultiModalProjector.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BeeMultiModalProjector.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BeeMultiModalProjector.pre_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BeeMultiModalProjector.linear_1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BeeMultiModalProjector.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BeeMultiModalProjector.linear_2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 2, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bee.BeeProcessingInfo", "methods": [ { "kind": "function", "name": "BeeProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BeeProcessingInfo.get_hf_processor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BeeProcessingInfo._get_num_unpadded_features", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 7, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bee.BeeForConditionalGeneration", "methods": [ { "kind": "function", "name": "BeeForConditionalGeneration.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BeeForConditionalGeneration.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BeeForConditionalGeneration.multi_modal_projector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 5, "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.bee", "names": [ "vllm.model_executor.models.bee.BeeDummyInputsBuilder", "vllm.model_executor.models.bee.BeeForConditionalGeneration", "vllm.model_executor.models.bee.BeeMultiModalProjector", "vllm.model_executor.models.bee.BeeProcessingInfo" ], "n_typable": 28, "n_typed": 18, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 14, "n_classes": 4, "n_attrs": 6, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/bert.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.bert.BertSelfOutput", "methods": [ { "kind": "function", "name": "BertSelfOutput.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BertSelfOutput.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BertSelfOutput.dense", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertSelfOutput.LayerNorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 7, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bert.BertForTokenClassification", "methods": [ { "kind": "function", "name": "BertForTokenClassification.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BertForTokenClassification.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BertForTokenClassification.load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BertForTokenClassification.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BertForTokenClassification.is_pooling_model", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BertForTokenClassification.head_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertForTokenClassification.num_labels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertForTokenClassification.bert", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertForTokenClassification.classifier", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertForTokenClassification.pooler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 11, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 9, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bert.BertEmbeddingModel", "methods": [ { "kind": "function", "name": "BertEmbeddingModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BertEmbeddingModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BertEmbeddingModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BertEmbeddingModel.load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BertEmbeddingModel._build_model", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BertEmbeddingModel._build_pooler", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BertEmbeddingModel.is_pooling_model", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BertEmbeddingModel.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertEmbeddingModel.pooler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 15, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 11, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bert.SPLADESparsePooler", "methods": [ { "kind": "function", "name": "SPLADESparsePooler.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "SPLADESparsePooler.get_supported_tasks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SPLADESparsePooler.get_pooling_updates", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SPLADESparsePooler.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SPLADESparsePooler.mlm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SPLADESparsePooler.cls_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SPLADESparsePooler.sep_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SPLADESparsePooler.pooling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SPLADESparsePooler.remove_cls_sep", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 11, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bert.BertEmbedding", "methods": [ { "kind": "function", "name": "BertEmbedding.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BertEmbedding.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BertEmbedding.size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertEmbedding.word_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertEmbedding.position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertEmbedding.token_type_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertEmbedding.LayerNorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertEmbedding.position_embedding_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 5, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bert.BertSelfAttention", "methods": [ { "kind": "function", "name": "BertSelfAttention.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "BertSelfAttention.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BertSelfAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertSelfAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertSelfAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertSelfAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertSelfAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertSelfAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertSelfAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertSelfAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertSelfAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertSelfAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertSelfAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 7, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 11, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bert.BertSpladeSparseEmbeddingModel", "methods": [ { "kind": "function", "name": "BertSpladeSparseEmbeddingModel.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BertSpladeSparseEmbeddingModel._build_pooler", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BertSpladeSparseEmbeddingModel.load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BertSpladeSparseEmbeddingModel.mlm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertSpladeSparseEmbeddingModel.pooler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 6, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 5, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bert.BertAttention", "methods": [ { "kind": "function", "name": "BertAttention.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "BertAttention.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BertAttention.self", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertAttention.output", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 8, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bert.BertPooler", "methods": [ { "kind": "function", "name": "BertPooler.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BertPooler.dense", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertPooler.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertPooler.head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 5, "n_typed": 1, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bert.BertPoolingModel", "methods": [ { "kind": "function", "name": "BertPoolingModel.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BertPoolingModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BertPoolingModel.is_pooling_model", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BertPoolingModel.pooler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bert.BertLayer", "methods": [ { "kind": "function", "name": "BertLayer.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BertLayer.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BertLayer.attention", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertLayer.intermediate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertLayer.output", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 5, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bert.BertEncoder", "methods": [ { "kind": "function", "name": "BertEncoder.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BertEncoder.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BertEncoder.layer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 6, "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bert.BertModel", "methods": [ { "kind": "function", "name": "BertModel.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BertModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BertModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BertModel._load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BertModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BertModel.is_pooling_model", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BertModel.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BertModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertModel.embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertModel.encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 14, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 10, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bert.BertOutput", "methods": [ { "kind": "function", "name": "BertOutput.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "BertOutput.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BertOutput.dense", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertOutput.LayerNorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 8, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bert.BertForSequenceClassification", "methods": [ { "kind": "function", "name": "BertForSequenceClassification.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BertForSequenceClassification.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BertForSequenceClassification.load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BertForSequenceClassification.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BertForSequenceClassification.is_pooling_model", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BertForSequenceClassification.num_labels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertForSequenceClassification.bert", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertForSequenceClassification.classifier", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertForSequenceClassification.pooler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 11, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 9, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bert.BertIntermediate", "methods": [ { "kind": "function", "name": "BertIntermediate.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "BertIntermediate.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BertIntermediate.dense", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertIntermediate.intermediate_act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 7, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bert.BertMLMHead", "methods": [ { "kind": "function", "name": "BertMLMHead.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BertMLMHead.tie_weights_with_embeddings", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BertMLMHead.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BertMLMHead.dense", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertMLMHead.activation", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertMLMHead.layer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertMLMHead.decoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 6, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 5, "n_attrs": 4, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.bert.TOKEN_TYPE_SHIFT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.bert", "names": [ "vllm.model_executor.models.bert.BertAttention", "vllm.model_executor.models.bert.BertEmbedding", "vllm.model_executor.models.bert.BertEmbeddingModel", "vllm.model_executor.models.bert.BertEncoder", "vllm.model_executor.models.bert.BertForSequenceClassification", "vllm.model_executor.models.bert.BertForTokenClassification", "vllm.model_executor.models.bert.BertIntermediate", "vllm.model_executor.models.bert.BertLayer", "vllm.model_executor.models.bert.BertMLMHead", "vllm.model_executor.models.bert.BertModel", "vllm.model_executor.models.bert.BertOutput", "vllm.model_executor.models.bert.BertPooler", "vllm.model_executor.models.bert.BertPoolingModel", "vllm.model_executor.models.bert.BertSelfAttention", "vllm.model_executor.models.bert.BertSelfOutput", "vllm.model_executor.models.bert.BertSpladeSparseEmbeddingModel", "vllm.model_executor.models.bert.SPLADESparsePooler", "vllm.model_executor.models.bert.TOKEN_TYPE_SHIFT" ], "n_typable": 212, "n_typed": 132, "n_any": 0, "n_untyped": 80, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 48, "n_method_overloads": 48, "n_method_params": 106, "n_classes": 17, "n_attrs": 65, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/bert_with_rope.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.bert_with_rope.BertWithRopeAttention", "methods": [ { "kind": "function", "name": "BertWithRopeAttention.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "BertWithRopeAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BertWithRopeAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertWithRopeAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertWithRopeAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertWithRopeAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertWithRopeAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertWithRopeAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertWithRopeAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertWithRopeAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertWithRopeAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertWithRopeAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertWithRopeAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertWithRopeAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertWithRopeAttention.out_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 24, "n_typed": 10, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 9, "n_attrs": 13, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bert_with_rope.BertWithRopeMLP", "methods": [ { "kind": "function", "name": "BertWithRopeMLP.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "BertWithRopeMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BertWithRopeMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertWithRopeMLP.up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertWithRopeMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 8, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bert_with_rope.BertWithRopeEncoder", "methods": [ { "kind": "function", "name": "BertWithRopeEncoder.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BertWithRopeEncoder.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BertWithRopeEncoder.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 7, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bert_with_rope.NomicMoE", "methods": [ { "kind": "function", "name": "NomicMoE.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "NomicMoE.weight_loader", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "NomicMoE.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "NomicMoE.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NomicMoE.num_total_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NomicMoE.top_k", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NomicMoE.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NomicMoE.total_intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NomicMoE.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NomicMoE.hidden_act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NomicMoE.params_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NomicMoE.router", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NomicMoE.w1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NomicMoE.w2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NomicMoE.bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 26, "n_typed": 12, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 11, "n_attrs": 12, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bert_with_rope.BertWithRopeBlock", "methods": [ { "kind": "function", "name": "BertWithRopeBlock.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "BertWithRopeBlock.forward", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BertWithRopeBlock.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertWithRopeBlock.attn_ln", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertWithRopeBlock.mlp_ln", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertWithRopeBlock.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 9, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 9, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bert_with_rope.SnowflakeGteNewModel", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "SnowflakeGteNewModel.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bert_with_rope.JinaRobertaModel", "methods": [ { "kind": "function", "name": "JinaRobertaModel.jina_merge_lora_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "JinaRobertaModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "JinaRobertaModel.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 5, "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bert_with_rope.BertWithRopeEmbedding", "methods": [ { "kind": "function", "name": "BertWithRopeEmbedding.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BertWithRopeEmbedding.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BertWithRopeEmbedding.word_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertWithRopeEmbedding.LayerNorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertWithRopeEmbedding.token_type_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 4, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bert_with_rope.BertWithRopeGatedMLP", "methods": [ { "kind": "function", "name": "BertWithRopeGatedMLP.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "BertWithRopeGatedMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BertWithRopeGatedMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertWithRopeGatedMLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertWithRopeGatedMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 8, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bert_with_rope.GteNewForSequenceClassification", "methods": [ { "kind": "function", "name": "GteNewForSequenceClassification.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GteNewForSequenceClassification.load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GteNewForSequenceClassification.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GteNewForSequenceClassification.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GteNewForSequenceClassification.is_pooling_model", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GteNewForSequenceClassification.new", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GteNewForSequenceClassification.classifier", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GteNewForSequenceClassification.pooler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 10, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bert_with_rope.GteNewModel", "methods": [ { "kind": "function", "name": "GteNewModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GteNewModel.split_up_gate_proj", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GteNewModel.ignore_unnecessary_layers", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GteNewModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GteNewModel.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 6, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 6, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bert_with_rope.NomicBertModel", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "NomicBertModel.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bert_with_rope.BertWithRope", "methods": [ { "kind": "function", "name": "BertWithRope.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BertWithRope.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BertWithRope.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "BertWithRope.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BertWithRope.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertWithRope.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertWithRope.add_pooling_layer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertWithRope.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertWithRope.embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertWithRope.encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BertWithRope.pooler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 13, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 10, "n_attrs": 7, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.bert_with_rope", "names": [ "vllm.model_executor.models.bert_with_rope.BertWithRope", "vllm.model_executor.models.bert_with_rope.BertWithRopeAttention", "vllm.model_executor.models.bert_with_rope.BertWithRopeBlock", "vllm.model_executor.models.bert_with_rope.BertWithRopeEmbedding", "vllm.model_executor.models.bert_with_rope.BertWithRopeEncoder", "vllm.model_executor.models.bert_with_rope.BertWithRopeGatedMLP", "vllm.model_executor.models.bert_with_rope.BertWithRopeMLP", "vllm.model_executor.models.bert_with_rope.GteNewForSequenceClassification", "vllm.model_executor.models.bert_with_rope.GteNewModel", "vllm.model_executor.models.bert_with_rope.JinaRobertaModel", "vllm.model_executor.models.bert_with_rope.NomicBertModel", "vllm.model_executor.models.bert_with_rope.NomicMoE", "vllm.model_executor.models.bert_with_rope.SnowflakeGteNewModel" ], "n_typable": 160, "n_typed": 90, "n_any": 0, "n_untyped": 70, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 29, "n_method_overloads": 29, "n_method_params": 78, "n_classes": 13, "n_attrs": 54, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/blip.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.blip.BlipEncoder", "methods": [ { "kind": "function", "name": "BlipEncoder.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BlipEncoder.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BlipEncoder.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlipEncoder.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 6, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 2, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.blip.get_blip_num_patches", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.models.blip.BlipMLP", "methods": [ { "kind": "function", "name": "BlipMLP.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BlipMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BlipMLP.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlipMLP.activation_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlipMLP.fc1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlipMLP.fc2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 6, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.blip.BlipEncoderLayer", "methods": [ { "kind": "function", "name": "BlipEncoderLayer.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BlipEncoderLayer.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BlipEncoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlipEncoderLayer.layer_norm1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlipEncoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlipEncoderLayer.layer_norm2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 6, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.blip.BlipVisionModel", "methods": [ { "kind": "function", "name": "BlipVisionModel.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "BlipVisionModel.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BlipVisionModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BlipVisionModel.config_class", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BlipVisionModel.main_input_name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BlipVisionModel.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BlipVisionModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlipVisionModel.embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlipVisionModel.encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlipVisionModel.post_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 10, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 7, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.blip.get_blip_patch_grid_length", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.models.blip.BlipVisionEmbeddings", "methods": [ { "kind": "function", "name": "BlipVisionEmbeddings.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BlipVisionEmbeddings.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BlipVisionEmbeddings.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlipVisionEmbeddings.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlipVisionEmbeddings.image_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlipVisionEmbeddings.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlipVisionEmbeddings.class_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlipVisionEmbeddings.patch_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlipVisionEmbeddings.num_patches", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlipVisionEmbeddings.num_positions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlipVisionEmbeddings.position_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 3, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.blip.BlipAttention", "methods": [ { "kind": "function", "name": "BlipAttention.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BlipAttention._shape", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BlipAttention.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BlipAttention.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlipAttention.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlipAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlipAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlipAttention.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlipAttention.dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlipAttention.qkv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlipAttention.projection", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlipAttention.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlipAttention.num_heads_per_partition", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlipAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 8, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 11, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.blip", "names": [ "vllm.model_executor.models.blip.BlipAttention", "vllm.model_executor.models.blip.BlipEncoder", "vllm.model_executor.models.blip.BlipEncoderLayer", "vllm.model_executor.models.blip.BlipMLP", "vllm.model_executor.models.blip.BlipVisionEmbeddings", "vllm.model_executor.models.blip.BlipVisionModel", "vllm.model_executor.models.blip.get_blip_num_patches", "vllm.model_executor.models.blip.get_blip_patch_grid_length" ], "n_typable": 83, "n_typed": 45, "n_any": 0, "n_untyped": 38, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 4, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 29, "n_classes": 6, "n_attrs": 37, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/blip2.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.blip2.Blip2ImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Blip2ImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Blip2ImagePixelInputs.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.blip2.Blip2ProcessingInfo", "methods": [ { "kind": "function", "name": "Blip2ProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Blip2ProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Blip2ProcessingInfo.get_num_image_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.blip2.Blip2QFormerModel", "methods": [ { "kind": "function", "name": "Blip2QFormerModel.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Blip2QFormerModel.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Blip2QFormerModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Blip2QFormerModel.layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Blip2QFormerModel.dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Blip2QFormerModel.encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 8, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.blip2.Blip2QFormerSelfOutput", "methods": [ { "kind": "function", "name": "Blip2QFormerSelfOutput.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Blip2QFormerSelfOutput.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Blip2QFormerSelfOutput.dense", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Blip2QFormerSelfOutput.LayerNorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Blip2QFormerSelfOutput.dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 6, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.blip2.Blip2QFormerAttention", "methods": [ { "kind": "function", "name": "Blip2QFormerAttention.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Blip2QFormerAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Blip2QFormerAttention.attention", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Blip2QFormerAttention.output", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 9, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.blip2.Blip2DummyInputsBuilder", "methods": [ { "kind": "function", "name": "Blip2DummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Blip2DummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.blip2.Blip2MultiModalProcessor", "methods": [ { "kind": "function", "name": "Blip2MultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Blip2MultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Blip2MultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.blip2.Blip2QFormerOutput", "methods": [ { "kind": "function", "name": "Blip2QFormerOutput.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Blip2QFormerOutput.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Blip2QFormerOutput.dense", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Blip2QFormerOutput.LayerNorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Blip2QFormerOutput.dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 6, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.blip2.Blip2ImageEmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Blip2ImageEmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Blip2ImageEmbeddingInputs.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.blip2.Blip2QFormerIntermediate", "methods": [ { "kind": "function", "name": "Blip2QFormerIntermediate.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Blip2QFormerIntermediate.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Blip2QFormerIntermediate.dense", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Blip2QFormerIntermediate.intermediate_act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.blip2.Blip2QFormerMultiHeadAttention", "methods": [ { "kind": "function", "name": "Blip2QFormerMultiHeadAttention.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Blip2QFormerMultiHeadAttention.transpose_for_scores", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Blip2QFormerMultiHeadAttention.forward", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Blip2QFormerMultiHeadAttention.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Blip2QFormerMultiHeadAttention.num_attention_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Blip2QFormerMultiHeadAttention.attention_head_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Blip2QFormerMultiHeadAttention.all_head_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Blip2QFormerMultiHeadAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Blip2QFormerMultiHeadAttention.query", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Blip2QFormerMultiHeadAttention.key", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Blip2QFormerMultiHeadAttention.value", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Blip2QFormerMultiHeadAttention.position_embedding_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Blip2QFormerMultiHeadAttention.dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 8, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 8, "n_attrs": 10, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.blip2.Blip2ImageInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.blip2.Blip2QFormerEncoder", "methods": [ { "kind": "function", "name": "Blip2QFormerEncoder.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Blip2QFormerEncoder.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Blip2QFormerEncoder.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Blip2QFormerEncoder.layer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 9, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.blip2.Blip2QFormerLayer", "methods": [ { "kind": "function", "name": "Blip2QFormerLayer.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Blip2QFormerLayer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Blip2QFormerLayer.feed_forward_chunk", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Blip2QFormerLayer.feed_forward_chunk_query", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Blip2QFormerLayer.chunk_size_feed_forward", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Blip2QFormerLayer.seq_len_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Blip2QFormerLayer.attention", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Blip2QFormerLayer.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Blip2QFormerLayer.intermediate_query", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Blip2QFormerLayer.output_query", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Blip2QFormerLayer.crossattention", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Blip2QFormerLayer.has_cross_attention", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 13, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 10, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.blip2.Blip2ForConditionalGeneration", "methods": [ { "kind": "function", "name": "Blip2ForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Blip2ForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Blip2ForConditionalGeneration._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Blip2ForConditionalGeneration._image_pixels_to_features", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Blip2ForConditionalGeneration._process_image_pixels", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Blip2ForConditionalGeneration._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Blip2ForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Blip2ForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Blip2ForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Blip2ForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Blip2ForConditionalGeneration.get_mm_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Blip2ForConditionalGeneration.get_num_mm_encoder_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Blip2ForConditionalGeneration.get_num_mm_connector_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Blip2ForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Blip2ForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Blip2ForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Blip2ForConditionalGeneration.vision_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Blip2ForConditionalGeneration.query_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Blip2ForConditionalGeneration.qformer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Blip2ForConditionalGeneration.language_projection", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Blip2ForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 40, "n_typed": 31, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 19, "n_attrs": 8, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.blip2", "names": [ "vllm.model_executor.models.blip2.Blip2DummyInputsBuilder", "vllm.model_executor.models.blip2.Blip2ForConditionalGeneration", "vllm.model_executor.models.blip2.Blip2ImageEmbeddingInputs", "vllm.model_executor.models.blip2.Blip2ImageInputs", "vllm.model_executor.models.blip2.Blip2ImagePixelInputs", "vllm.model_executor.models.blip2.Blip2MultiModalProcessor", "vllm.model_executor.models.blip2.Blip2ProcessingInfo", "vllm.model_executor.models.blip2.Blip2QFormerAttention", "vllm.model_executor.models.blip2.Blip2QFormerEncoder", "vllm.model_executor.models.blip2.Blip2QFormerIntermediate", "vllm.model_executor.models.blip2.Blip2QFormerLayer", "vllm.model_executor.models.blip2.Blip2QFormerModel", "vllm.model_executor.models.blip2.Blip2QFormerMultiHeadAttention", "vllm.model_executor.models.blip2.Blip2QFormerOutput", "vllm.model_executor.models.blip2.Blip2QFormerSelfOutput" ], "n_typable": 168, "n_typed": 120, "n_any": 0, "n_untyped": 48, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 40, "n_method_overloads": 40, "n_method_params": 81, "n_classes": 14, "n_attrs": 47, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/bloom.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.bloom.BloomMLP", "methods": [ { "kind": "function", "name": "BloomMLP.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BloomMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BloomMLP.dense_h_to_4h", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BloomMLP.gelu_impl", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BloomMLP.dense_4h_to_h", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 5, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bloom.BloomAttention", "methods": [ { "kind": "function", "name": "BloomAttention.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BloomAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BloomAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BloomAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BloomAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BloomAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BloomAttention.query_key_value", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BloomAttention.dense", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BloomAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 7, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bloom.BloomModel", "methods": [ { "kind": "function", "name": "BloomModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BloomModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BloomModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BloomModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BloomModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BloomModel.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BloomModel.word_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BloomModel.word_embeddings_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BloomModel.ln_f", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BloomModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 11, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bloom.BloomBlock", "methods": [ { "kind": "function", "name": "BloomBlock.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BloomBlock.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BloomBlock.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BloomBlock.self_attention", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BloomBlock.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BloomBlock.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BloomBlock.apply_residual_connection_post_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 7, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.bloom.BloomForCausalLM", "methods": [ { "kind": "function", "name": "BloomForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BloomForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BloomForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BloomForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BloomForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BloomForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BloomForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BloomForCausalLM.transformer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BloomForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BloomForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BloomForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 13, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.bloom", "names": [ "vllm.model_executor.models.bloom.BloomAttention", "vllm.model_executor.models.bloom.BloomBlock", "vllm.model_executor.models.bloom.BloomForCausalLM", "vllm.model_executor.models.bloom.BloomMLP", "vllm.model_executor.models.bloom.BloomModel" ], "n_typable": 75, "n_typed": 43, "n_any": 0, "n_untyped": 32, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 33, "n_classes": 5, "n_attrs": 27, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/chameleon.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.chameleon.ChameleonAttention", "methods": [ { "kind": "function", "name": "ChameleonAttention.__init__", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "ChameleonAttention._apply_qk_norm", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ChameleonAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ChameleonAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonAttention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonAttention.q_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonAttention.k_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 32, "n_typed": 16, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 13, "n_attrs": 16, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.chameleon.ChameleonImageVocabularyMapping", "methods": [ { "kind": "function", "name": "ChameleonImageVocabularyMapping.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ChameleonImageVocabularyMapping.convert_img2bpe", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "ChameleonImageVocabularyMapping.val2name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "ChameleonImageVocabularyMapping.image_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "ChameleonImageVocabularyMapping.bpe2img", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "ChameleonImageVocabularyMapping.img2bpe", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "ChameleonImageVocabularyMapping.bpe2img_search_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "ChameleonImageVocabularyMapping.img2bpe_mapping_tensor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "ChameleonImageVocabularyMapping.vocab_map", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonImageVocabularyMapping.image_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 3, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 2, "n_properties": 6 }, { "kind": "class", "name": "vllm.model_executor.models.chameleon.ChameleonDummyInputsBuilder", "methods": [ { "kind": "function", "name": "ChameleonDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ChameleonDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.chameleon.ChameleonMultiModalProcessor", "methods": [ { "kind": "function", "name": "ChameleonMultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ChameleonMultiModalProcessor._apply_hf_processor_tokens_only", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ChameleonMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ChameleonMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 14, "n_typed": 14, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 10, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.chameleon.ChameleonVQVAEEncoderResnetBlock", "methods": [ { "kind": "function", "name": "ChameleonVQVAEEncoderResnetBlock.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ChameleonVQVAEEncoderResnetBlock.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ChameleonVQVAEEncoderResnetBlock.in_channels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonVQVAEEncoderResnetBlock.out_channels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonVQVAEEncoderResnetBlock.use_conv_shortcut", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonVQVAEEncoderResnetBlock.norm1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonVQVAEEncoderResnetBlock.conv1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonVQVAEEncoderResnetBlock.norm2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonVQVAEEncoderResnetBlock.dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonVQVAEEncoderResnetBlock.conv2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonVQVAEEncoderResnetBlock.conv_shortcut", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonVQVAEEncoderResnetBlock.nin_shortcut", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 3, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 10, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.chameleon.ChameleonVQVAEEncoderConvDownsample", "methods": [ { "kind": "function", "name": "ChameleonVQVAEEncoderConvDownsample.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ChameleonVQVAEEncoderConvDownsample.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ChameleonVQVAEEncoderConvDownsample.conv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 5, "n_typed": 2, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.chameleon.ChameleonVQVAEVectorQuantizer", "methods": [ { "kind": "function", "name": "ChameleonVQVAEVectorQuantizer.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ChameleonVQVAEVectorQuantizer.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ChameleonVQVAEVectorQuantizer.num_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonVQVAEVectorQuantizer.embedding_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonVQVAEVectorQuantizer.beta", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonVQVAEVectorQuantizer.embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonVQVAEVectorQuantizer.re_embed", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 2, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.chameleon.ChameleonDecoderLayer", "methods": [ { "kind": "function", "name": "ChameleonDecoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ChameleonDecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ChameleonDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 9, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.chameleon.ChameleonImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ChameleonImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonImagePixelInputs.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.chameleon.ChameleonSwinDecoderLayer", "methods": [ { "kind": "function", "name": "ChameleonSwinDecoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ChameleonSwinDecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ChameleonSwinDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonSwinDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonSwinDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonSwinDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonSwinDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 9, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.chameleon.ChameleonMLP", "methods": [ { "kind": "function", "name": "ChameleonMLP.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "ChameleonMLP.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ChameleonMLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.chameleon.ChameleonVQVAEEncoder", "methods": [ { "kind": "function", "name": "ChameleonVQVAEEncoder.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ChameleonVQVAEEncoder.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ChameleonVQVAEEncoder.num_resolutions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonVQVAEEncoder.num_res_blocks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonVQVAEEncoder.conv_in", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonVQVAEEncoder.in_channel_multiplier", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonVQVAEEncoder.down", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonVQVAEEncoder.mid", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonVQVAEEncoder.norm_out", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonVQVAEEncoder.conv_out", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 2, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.chameleon.ChameleonModel", "methods": [ { "kind": "function", "name": "ChameleonModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ChameleonModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ChameleonModel.get_image_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ChameleonModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ChameleonModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonModel.vocabulary_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonModel.vqmodel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 11, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.chameleon.ChameleonLayerNorm", "methods": [ { "kind": "function", "name": "ChameleonLayerNorm.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ChameleonLayerNorm.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ChameleonLayerNorm.normalized_shape", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 0, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.chameleon.ChameleonVQVAE", "methods": [ { "kind": "function", "name": "ChameleonVQVAE.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ChameleonVQVAE.encode", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ChameleonVQVAE.encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonVQVAE.quantize", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonVQVAE.quant_conv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonVQVAE.post_quant_conv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 3, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.chameleon.ChameleonVQVAEEncoderAttnBlock", "methods": [ { "kind": "function", "name": "ChameleonVQVAEEncoderAttnBlock.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ChameleonVQVAEEncoderAttnBlock.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ChameleonVQVAEEncoderAttnBlock.in_channels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonVQVAEEncoderAttnBlock.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonVQVAEEncoderAttnBlock.q", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonVQVAEEncoderAttnBlock.k", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonVQVAEEncoderAttnBlock.v", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonVQVAEEncoderAttnBlock.proj_out", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 2, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.chameleon.ChameleonForConditionalGeneration", "methods": [ { "kind": "function", "name": "ChameleonForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ChameleonForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ChameleonForConditionalGeneration._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ChameleonForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ChameleonForConditionalGeneration.forward", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "ChameleonForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ChameleonForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ChameleonForConditionalGeneration.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ChameleonForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonForConditionalGeneration.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonForConditionalGeneration.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChameleonForConditionalGeneration.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 26, "n_typed": 18, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 13, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.chameleon.ChameleonProcessingInfo", "methods": [ { "kind": "function", "name": "ChameleonProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ChameleonProcessingInfo.get_hf_processor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ChameleonProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ChameleonProcessingInfo.get_num_image_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 5, "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.chameleon.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.models.chameleon", "names": [ "vllm.model_executor.models.chameleon.ChameleonAttention", "vllm.model_executor.models.chameleon.ChameleonDecoderLayer", "vllm.model_executor.models.chameleon.ChameleonDummyInputsBuilder", "vllm.model_executor.models.chameleon.ChameleonForConditionalGeneration", "vllm.model_executor.models.chameleon.ChameleonImagePixelInputs", "vllm.model_executor.models.chameleon.ChameleonImageVocabularyMapping", "vllm.model_executor.models.chameleon.ChameleonLayerNorm", "vllm.model_executor.models.chameleon.ChameleonMLP", "vllm.model_executor.models.chameleon.ChameleonModel", "vllm.model_executor.models.chameleon.ChameleonMultiModalProcessor", "vllm.model_executor.models.chameleon.ChameleonProcessingInfo", "vllm.model_executor.models.chameleon.ChameleonSwinDecoderLayer", "vllm.model_executor.models.chameleon.ChameleonVQVAE", "vllm.model_executor.models.chameleon.ChameleonVQVAEEncoder", "vllm.model_executor.models.chameleon.ChameleonVQVAEEncoderAttnBlock", "vllm.model_executor.models.chameleon.ChameleonVQVAEEncoderConvDownsample", "vllm.model_executor.models.chameleon.ChameleonVQVAEEncoderResnetBlock", "vllm.model_executor.models.chameleon.ChameleonVQVAEVectorQuantizer", "vllm.model_executor.models.chameleon.logger" ], "n_typable": 225, "n_typed": 112, "n_any": 0, "n_untyped": 113, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 46, "n_method_overloads": 46, "n_method_params": 91, "n_classes": 18, "n_attrs": 83, "n_properties": 6, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/chatglm.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.chatglm.ChatGLMForCausalLM", "methods": [ { "kind": "function", "name": "ChatGLMForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ChatGLMForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ChatGLMForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 8, "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.chatglm.ChatGLMModel", "methods": [ { "kind": "function", "name": "ChatGLMModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ChatGLMModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ChatGLMModel.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "ChatGLMModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ChatGLMModel.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ChatGLMModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMModel.embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMModel.num_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMModel.multi_query_group_num", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMModel.kv_channels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMModel.encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMModel.output_layer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 12, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 9, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.chatglm.ChatGLMBaseModel", "methods": [ { "kind": "function", "name": "ChatGLMBaseModel.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ChatGLMBaseModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ChatGLMBaseModel.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ChatGLMBaseModel.load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ChatGLMBaseModel.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMBaseModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMBaseModel.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMBaseModel.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMBaseModel.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMBaseModel.transformer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMBaseModel.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMBaseModel.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMBaseModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 9, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 6, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.chatglm.GLMMLP", "methods": [ { "kind": "function", "name": "GLMMLP.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GLMMLP.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GLMMLP.add_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GLMMLP.dense_h_to_4h", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GLMMLP.activation_func", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GLMMLP.dense_4h_to_h", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 3, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.chatglm.GLMAttention", "methods": [ { "kind": "function", "name": "GLMAttention.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GLMAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GLMAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GLMAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GLMAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GLMAttention.multi_query_attention", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GLMAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GLMAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GLMAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GLMAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GLMAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GLMAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GLMAttention.query_key_value", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GLMAttention.dense", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GLMAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GLMAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 7, "n_any": 0, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 14, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.chatglm.GLMTransformer", "methods": [ { "kind": "function", "name": "GLMTransformer.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GLMTransformer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GLMTransformer.post_layer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GLMTransformer.num_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GLMTransformer.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GLMTransformer.final_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.chatglm.GLMBlock", "methods": [ { "kind": "function", "name": "GLMBlock.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GLMBlock.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GLMBlock.apply_residual_connection_post_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GLMBlock.fp32_residual_connection", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GLMBlock.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GLMBlock.self_attention", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GLMBlock.hidden_dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GLMBlock.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GLMBlock.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 7, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 7, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.chatglm", "names": [ "vllm.model_executor.models.chatglm.ChatGLMBaseModel", "vllm.model_executor.models.chatglm.ChatGLMForCausalLM", "vllm.model_executor.models.chatglm.ChatGLMModel", "vllm.model_executor.models.chatglm.GLMAttention", "vllm.model_executor.models.chatglm.GLMBlock", "vllm.model_executor.models.chatglm.GLMMLP", "vllm.model_executor.models.chatglm.GLMTransformer" ], "n_typable": 107, "n_typed": 52, "n_any": 0, "n_untyped": 55, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 18, "n_method_overloads": 18, "n_method_params": 43, "n_classes": 7, "n_attrs": 48, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/clip.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.clip.CLIPTextEmbeddings", "methods": [ { "kind": "function", "name": "CLIPTextEmbeddings.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CLIPTextEmbeddings.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CLIPTextEmbeddings.token_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPTextEmbeddings.position_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 5, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.clip.CLIPEncoder", "methods": [ { "kind": "function", "name": "CLIPEncoder.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "CLIPEncoder.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CLIPEncoder.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPEncoder.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 9, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.clip.CLIPVisionTransformer", "methods": [ { "kind": "function", "name": "CLIPVisionTransformer.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "CLIPVisionTransformer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "CLIPVisionTransformer.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "CLIPVisionTransformer.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "CLIPVisionTransformer.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "CLIPVisionTransformer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPVisionTransformer.embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPVisionTransformer.pre_layrnorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPVisionTransformer.encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPVisionTransformer.post_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 12, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 5, "n_properties": 2 }, { "kind": "class", "name": "vllm.model_executor.models.clip.CLIPImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "CLIPImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CLIPImagePixelInputs.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.clip.CLIPEncoderLayer", "methods": [ { "kind": "function", "name": "CLIPEncoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "CLIPEncoderLayer.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CLIPEncoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPEncoderLayer.layer_norm1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPEncoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPEncoderLayer.layer_norm2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 7, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.clip.CLIPTextTransformer", "methods": [ { "kind": "function", "name": "CLIPTextTransformer.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "CLIPTextTransformer.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CLIPTextTransformer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "CLIPTextTransformer.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CLIPTextTransformer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPTextTransformer.embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPTextTransformer.encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPTextTransformer.final_layer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 12, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.clip.CLIPEncoderInfo", "methods": [ { "kind": "function", "name": "CLIPEncoderInfo.get_num_image_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CLIPEncoderInfo.get_image_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CLIPEncoderInfo.get_patch_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CLIPEncoderInfo.get_patch_grid_length", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.clip.CLIPMultiModalProcessor", "methods": [ { "kind": "function", "name": "CLIPMultiModalProcessor.apply", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CLIPMultiModalProcessor._hf_processor_applies_updates", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "CLIPMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CLIPMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [ { "kind": "property", "name": "CLIPMultiModalProcessor.image_token_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [], "n_typable": 16, "n_typed": 16, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 11, "n_attrs": 0, "n_properties": 1 }, { "kind": "class", "name": "vllm.model_executor.models.clip.CLIPMLP", "methods": [ { "kind": "function", "name": "CLIPMLP.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "CLIPMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CLIPMLP.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPMLP.activation_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPMLP.fc1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPMLP.fc2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 6, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.clip.CLIPProcessingInfo", "methods": [ { "kind": "function", "name": "CLIPProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CLIPProcessingInfo.get_vision_encoder_info", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CLIPProcessingInfo.get_hf_processor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CLIPProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CLIPProcessingInfo.get_num_image_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CLIPProcessingInfo.get_image_size_with_most_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CLIPProcessingInfo.get_max_image_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 10, "n_typed": 7, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.clip.CLIPEmbeddingModel", "methods": [ { "kind": "function", "name": "CLIPEmbeddingModel.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CLIPEmbeddingModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CLIPEmbeddingModel.get_text_features", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "CLIPEmbeddingModel.get_image_features", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CLIPEmbeddingModel._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CLIPEmbeddingModel._process_image_inputs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CLIPEmbeddingModel._embed_text_input_ids", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "CLIPEmbeddingModel.embed_input_ids", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "CLIPEmbeddingModel.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CLIPEmbeddingModel.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "CLIPEmbeddingModel.load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CLIPEmbeddingModel.is_pooling_model", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CLIPEmbeddingModel.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CLIPEmbeddingModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPEmbeddingModel.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPEmbeddingModel.projection_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPEmbeddingModel.text_embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPEmbeddingModel.vision_embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPEmbeddingModel.pooler_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPEmbeddingModel.pooler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPEmbeddingModel.text_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPEmbeddingModel.text_projection", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPEmbeddingModel.vision_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPEmbeddingModel.visual_projection", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 48, "n_typed": 35, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 26, "n_attrs": 13, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.clip.CLIPDummyInputsBuilder", "methods": [ { "kind": "function", "name": "CLIPDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CLIPDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.clip.CLIPVisionEmbeddings", "methods": [ { "kind": "function", "name": "CLIPVisionEmbeddings.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CLIPVisionEmbeddings.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CLIPVisionEmbeddings.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPVisionEmbeddings.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPVisionEmbeddings.image_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPVisionEmbeddings.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPVisionEmbeddings.class_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPVisionEmbeddings.patch_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPVisionEmbeddings.num_patches", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPVisionEmbeddings.num_positions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPVisionEmbeddings.position_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 3, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.clip.CLIPVisionModel", "methods": [ { "kind": "function", "name": "CLIPVisionModel.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "CLIPVisionModel.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [ { "kind": "property", "name": "CLIPVisionModel.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "CLIPVisionModel.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "CLIPVisionModel.vision_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 10, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 1, "n_properties": 2 }, { "kind": "class", "name": "vllm.model_executor.models.clip.CLIPAttention", "methods": [ { "kind": "function", "name": "CLIPAttention.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "CLIPAttention.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CLIPAttention.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPAttention.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPAttention.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPAttention.out_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPAttention.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPAttention.num_heads_per_partition", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CLIPAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 6, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 10, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.clip", "names": [ "vllm.model_executor.models.clip.CLIPAttention", "vllm.model_executor.models.clip.CLIPDummyInputsBuilder", "vllm.model_executor.models.clip.CLIPEmbeddingModel", "vllm.model_executor.models.clip.CLIPEncoder", "vllm.model_executor.models.clip.CLIPEncoderInfo", "vllm.model_executor.models.clip.CLIPEncoderLayer", "vllm.model_executor.models.clip.CLIPImagePixelInputs", "vllm.model_executor.models.clip.CLIPMLP", "vllm.model_executor.models.clip.CLIPMultiModalProcessor", "vllm.model_executor.models.clip.CLIPProcessingInfo", "vllm.model_executor.models.clip.CLIPTextEmbeddings", "vllm.model_executor.models.clip.CLIPTextTransformer", "vllm.model_executor.models.clip.CLIPVisionEmbeddings", "vllm.model_executor.models.clip.CLIPVisionModel", "vllm.model_executor.models.clip.CLIPVisionTransformer" ], "n_typable": 206, "n_typed": 142, "n_any": 0, "n_untyped": 64, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 49, "n_method_overloads": 49, "n_method_params": 98, "n_classes": 15, "n_attrs": 56, "n_properties": 5, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/cohere2_vision.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.cohere2_vision.Cohere2VisionForConditionalGeneration", "methods": [ { "kind": "function", "name": "Cohere2VisionForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Cohere2VisionForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Cohere2VisionForConditionalGeneration._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Cohere2VisionForConditionalGeneration._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Cohere2VisionForConditionalGeneration._patch_quant_config", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Cohere2VisionForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Cohere2VisionForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Cohere2VisionForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "Cohere2VisionForConditionalGeneration.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "Cohere2VisionForConditionalGeneration.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Cohere2VisionForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Cohere2VisionForConditionalGeneration.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Cohere2VisionForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Cohere2VisionForConditionalGeneration.vision_tower", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Cohere2VisionForConditionalGeneration.multi_modal_projector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Cohere2VisionForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 31, "n_typed": 20, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 15, "n_attrs": 7, "n_properties": 1 }, { "kind": "class", "name": "vllm.model_executor.models.cohere2_vision.Cohere2VisionDummyInputsBuilder", "methods": [ { "kind": "function", "name": "Cohere2VisionDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Cohere2VisionDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.cohere2_vision.Cohere2VisionMultiModalProcessor", "methods": [ { "kind": "function", "name": "Cohere2VisionMultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Cohere2VisionMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Cohere2VisionMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.cohere2_vision.Cohere2VisionProcessingInfo", "methods": [ { "kind": "function", "name": "Cohere2VisionProcessingInfo.get_hf_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Cohere2VisionProcessingInfo.get_hf_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Cohere2VisionProcessingInfo.get_image_processor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Cohere2VisionProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Cohere2VisionProcessingInfo.get_image_size_with_most_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Cohere2VisionProcessingInfo.get_num_patches", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 11, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 6, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.cohere2_vision.Cohere2VisionMultiModalProjector", "methods": [ { "kind": "function", "name": "Cohere2VisionMultiModalProjector.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Cohere2VisionMultiModalProjector.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Cohere2VisionMultiModalProjector.pixel_shuffle", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Cohere2VisionMultiModalProjector.downsample_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Cohere2VisionMultiModalProjector.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Cohere2VisionMultiModalProjector.linear_1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Cohere2VisionMultiModalProjector.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Cohere2VisionMultiModalProjector.linear_2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 4, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.cohere2_vision.Cohere2VisionImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Cohere2VisionImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Cohere2VisionImagePixelInputs.pixel_values", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Cohere2VisionImagePixelInputs.num_patches", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.cohere2_vision", "names": [ "vllm.model_executor.models.cohere2_vision.Cohere2VisionDummyInputsBuilder", "vllm.model_executor.models.cohere2_vision.Cohere2VisionForConditionalGeneration", "vllm.model_executor.models.cohere2_vision.Cohere2VisionImagePixelInputs", "vllm.model_executor.models.cohere2_vision.Cohere2VisionMultiModalProcessor", "vllm.model_executor.models.cohere2_vision.Cohere2VisionMultiModalProjector", "vllm.model_executor.models.cohere2_vision.Cohere2VisionProcessingInfo" ], "n_typable": 76, "n_typed": 56, "n_any": 0, "n_untyped": 20, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 22, "n_method_overloads": 22, "n_method_params": 38, "n_classes": 6, "n_attrs": 15, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/colbert.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.colbert.ColBERTModel", "methods": [ { "kind": "function", "name": "ColBERTModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ColBERTModel._build_model", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ColBERTModel._build_pooler", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ColBERTModel.load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 10, "n_typed": 8, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 6, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.colbert.ColBERTJinaRobertaModel", "methods": [ { "kind": "function", "name": "ColBERTJinaRobertaModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ColBERTJinaRobertaModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ColBERTJinaRobertaModel.forward", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ColBERTJinaRobertaModel.load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ColBERTJinaRobertaModel.is_pooling_model", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ColBERTJinaRobertaModel.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ColBERTJinaRobertaModel.pooler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 9, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.colbert.ColBERTMixin", "methods": [ { "kind": "function", "name": "ColBERTMixin._init_colbert_components", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ColBERTMixin._build_colbert_linear", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ColBERTMixin._build_colbert_pooler", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ColBERTMixin.get_colbert_dim_from_config", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ColBERTMixin._load_colbert_weights", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ColBERTMixin.supports_late_interaction", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ColBERTMixin.colbert_dim", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ColBERTMixin.colbert_linear", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ColBERTMixin.hidden_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ColBERTMixin.head_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 17, "n_typed": 16, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 7, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.colbert.ColBERTModernBertModel", "methods": [ { "kind": "function", "name": "ColBERTModernBertModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ColBERTModernBertModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ColBERTModernBertModel.forward", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ColBERTModernBertModel.load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ColBERTModernBertModel.is_pooling_model", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ColBERTModernBertModel.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ColBERTModernBertModel.pooler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 9, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.colbert", "names": [ "vllm.model_executor.models.colbert.ColBERTJinaRobertaModel", "vllm.model_executor.models.colbert.ColBERTMixin", "vllm.model_executor.models.colbert.ColBERTModel", "vllm.model_executor.models.colbert.ColBERTModernBertModel" ], "n_typable": 55, "n_typed": 42, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 17, "n_method_overloads": 17, "n_method_params": 29, "n_classes": 4, "n_attrs": 11, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/colmodernvbert.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.colmodernvbert.ColModernVBertProcessingInfo", "methods": [ { "kind": "function", "name": "ColModernVBertProcessingInfo.get_hf_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ColModernVBertProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ColModernVBertProcessingInfo.get_image_size_with_most_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ColModernVBertProcessingInfo.get_num_image_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.colmodernvbert.ColModernVBertConnector", "methods": [ { "kind": "function", "name": "ColModernVBertConnector.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ColModernVBertConnector.pixel_shuffle", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ColModernVBertConnector.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ColModernVBertConnector.pixel_shuffle_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ColModernVBertConnector.proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 5, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.colmodernvbert.ColModernVBertMultiModalProcessor", "methods": [ { "kind": "function", "name": "ColModernVBertMultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ColModernVBertMultiModalProcessor._hf_processor_applies_updates", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ColModernVBertMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ColModernVBertMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 17, "n_typed": 17, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 13, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.colmodernvbert.ColModernVBertDummyInputsBuilder", "methods": [ { "kind": "function", "name": "ColModernVBertDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ColModernVBertDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.colmodernvbert.ColModernVBertForRetrieval", "methods": [ { "kind": "function", "name": "ColModernVBertForRetrieval.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ColModernVBertForRetrieval._get_image_features", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ColModernVBertForRetrieval.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ColModernVBertForRetrieval.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ColModernVBertForRetrieval.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ColModernVBertForRetrieval.is_pooling_model", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ColModernVBertForRetrieval.supports_late_interaction", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ColModernVBertForRetrieval.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ColModernVBertForRetrieval.vision_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ColModernVBertForRetrieval.connector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ColModernVBertForRetrieval.text_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ColModernVBertForRetrieval.text_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ColModernVBertForRetrieval.text_final_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ColModernVBertForRetrieval.custom_text_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ColModernVBertForRetrieval.pooler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ColModernVBertForRetrieval.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ColModernVBertForRetrieval._BASE_EMB", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ColModernVBertForRetrieval._EXTRA_EMB", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 24, "n_typed": 14, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 13, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.colmodernvbert", "names": [ "vllm.model_executor.models.colmodernvbert.ColModernVBertConnector", "vllm.model_executor.models.colmodernvbert.ColModernVBertDummyInputsBuilder", "vllm.model_executor.models.colmodernvbert.ColModernVBertForRetrieval", "vllm.model_executor.models.colmodernvbert.ColModernVBertMultiModalProcessor", "vllm.model_executor.models.colmodernvbert.ColModernVBertProcessingInfo" ], "n_typable": 61, "n_typed": 48, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 18, "n_method_overloads": 18, "n_method_params": 31, "n_classes": 5, "n_attrs": 15, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/colqwen3.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.colqwen3.ColQwen3ProcessingInfo", "methods": [ { "kind": "function", "name": "ColQwen3ProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ColQwen3ProcessingInfo.get_hf_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ColQwen3ProcessingInfo.get_video_processor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ColQwen3ProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ColQwen3ProcessingInfo.get_mm_max_tokens_per_item", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ColQwen3ProcessingInfo.get_data_parser", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "ColQwen3ProcessingInfo._supports_video", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [], "n_typable": 11, "n_typed": 8, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 4, "n_attrs": 0, "n_properties": 1 }, { "kind": "class", "name": "vllm.model_executor.models.colqwen3.ColQwen3Model", "methods": [ { "kind": "function", "name": "ColQwen3Model.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ColQwen3Model.forward", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "ColQwen3Model._is_proj_weight", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ColQwen3Model.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ColQwen3Model.is_pooling_model", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ColQwen3Model.supports_late_interaction", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ColQwen3Model.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ColQwen3Model.embed_dim", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ColQwen3Model.pooler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ColQwen3Model.custom_text_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ColQwen3Model._PROJ_LAYER_NAMES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 18, "n_typed": 13, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 9, "n_attrs": 7, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.colqwen3", "names": [ "vllm.model_executor.models.colqwen3.ColQwen3Model", "vllm.model_executor.models.colqwen3.ColQwen3ProcessingInfo" ], "n_typable": 29, "n_typed": 21, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 13, "n_classes": 2, "n_attrs": 7, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/commandr.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.commandr.LayerNorm", "methods": [ { "kind": "function", "name": "LayerNorm.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LayerNorm.forward", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LayerNorm.weight", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LayerNorm.variance_epsilon", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 0, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.commandr.CohereDecoderLayer", "methods": [ { "kind": "function", "name": "CohereDecoderLayer.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "CohereDecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CohereDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CohereDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CohereDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CohereDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 8, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.commandr.CohereForCausalLM", "methods": [ { "kind": "function", "name": "CohereForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CohereForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CohereForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "CohereForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CohereForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CohereForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CohereForCausalLM.embedding_modules", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CohereForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CohereForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CohereForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CohereForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CohereForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 13, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 7, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.commandr.layer_norm_func", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.model_executor.models.commandr.CohereModel", "methods": [ { "kind": "function", "name": "CohereModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CohereModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CohereModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "CohereModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CohereModel.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CohereModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CohereModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CohereModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CohereModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CohereModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 11, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.commandr.CohereMLP", "methods": [ { "kind": "function", "name": "CohereMLP.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "CohereMLP.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CohereMLP.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CohereMLP.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CohereMLP.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CohereMLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CohereMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CohereMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 3, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.commandr.CohereAttention", "methods": [ { "kind": "function", "name": "CohereAttention.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "CohereAttention._apply_qk_norm", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CohereAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CohereAttention.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CohereAttention.attention_dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CohereAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CohereAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CohereAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CohereAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CohereAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CohereAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CohereAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CohereAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CohereAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CohereAttention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CohereAttention.use_qk_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CohereAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CohereAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CohereAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CohereAttention.v1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CohereAttention.sliding_window", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CohereAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CohereAttention.q_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CohereAttention.k_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 32, "n_typed": 7, "n_any": 0, "n_untyped": 25, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 8, "n_attrs": 21, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.commandr", "names": [ "vllm.model_executor.models.commandr.CohereAttention", "vllm.model_executor.models.commandr.CohereDecoderLayer", "vllm.model_executor.models.commandr.CohereForCausalLM", "vllm.model_executor.models.commandr.CohereMLP", "vllm.model_executor.models.commandr.CohereModel", "vllm.model_executor.models.commandr.LayerNorm", "vllm.model_executor.models.commandr.layer_norm_func" ], "n_typable": 106, "n_typed": 42, "n_any": 0, "n_untyped": 64, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 3, "n_methods": 18, "n_method_overloads": 18, "n_method_params": 40, "n_classes": 6, "n_attrs": 46, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/config.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.config.JinaVLForSequenceClassificationConfig", "methods": [ { "kind": "function", "name": "JinaVLForSequenceClassificationConfig.verify_and_update_model_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.config.Qwen2ForProcessRewardModelConfig", "methods": [ { "kind": "function", "name": "Qwen2ForProcessRewardModelConfig.verify_and_update_model_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.config.Qwen3ForSequenceClassificationConfig", "methods": [ { "kind": "function", "name": "Qwen3ForSequenceClassificationConfig.verify_and_update_model_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.config.GteNewModelConfig", "methods": [ { "kind": "function", "name": "GteNewModelConfig.verify_and_update_model_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.config.MambaModelConfig", "methods": [ { "kind": "function", "name": "MambaModelConfig.verify_and_update_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.config.NomicBertModelConfig", "methods": [ { "kind": "function", "name": "NomicBertModelConfig.verify_and_update_model_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.config.Gemma3TextModelConfig", "methods": [ { "kind": "function", "name": "Gemma3TextModelConfig.verify_and_update_model_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.config.DeepseekV32ForCausalLM", "methods": [ { "kind": "function", "name": "DeepseekV32ForCausalLM.verify_and_update_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.config.JambaForSequenceClassificationConfig", "methods": [ { "kind": "function", "name": "JambaForSequenceClassificationConfig.verify_and_update_model_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.config.SnowflakeGteNewModelConfig", "methods": [ { "kind": "function", "name": "SnowflakeGteNewModelConfig.verify_and_update_model_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.config.GptOssForCausalLMConfig", "methods": [ { "kind": "function", "name": "GptOssForCausalLMConfig.verify_and_update_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.config.LlamaBidirectionalConfig", "methods": [ { "kind": "function", "name": "LlamaBidirectionalConfig.verify_and_update_model_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.config.HybridAttentionMambaModelConfig", "methods": [ { "kind": "function", "name": "HybridAttentionMambaModelConfig.verify_and_update_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.config.VoyageQwen3BidirectionalEmbedModelConfig", "methods": [ { "kind": "function", "name": "VoyageQwen3BidirectionalEmbedModelConfig.verify_and_update_model_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.config.NemotronHForCausalLMConfig", "methods": [ { "kind": "function", "name": "NemotronHForCausalLMConfig.verify_and_update_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.config.Qwen3_5ForConditionalGenerationConfig", "methods": [ { "kind": "function", "name": "Qwen3_5ForConditionalGenerationConfig.verify_and_update_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.config.Qwen2ForRewardModelConfig", "methods": [ { "kind": "function", "name": "Qwen2ForRewardModelConfig.verify_and_update_model_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.config.MODELS_CONFIG_MAP", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.config.JinaRobertaModelConfig", "methods": [ { "kind": "function", "name": "JinaRobertaModelConfig.verify_and_update_model_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.config.Qwen3VLForSequenceClassificationConfig", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.config.LlamaNemotronVLConfig", "methods": [ { "kind": "function", "name": "LlamaNemotronVLConfig.verify_and_update_model_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.config.Ernie4_5_VLMoeForConditionalGenerationConfig", "methods": [ { "kind": "function", "name": "Ernie4_5_VLMoeForConditionalGenerationConfig.verify_and_update_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.config.VerifyAndUpdateConfig", "methods": [ { "kind": "function", "name": "VerifyAndUpdateConfig.verify_and_update_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "VerifyAndUpdateConfig.verify_and_update_model_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.config.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.models.config", "names": [ "vllm.model_executor.models.config.DeepseekV32ForCausalLM", "vllm.model_executor.models.config.Ernie4_5_VLMoeForConditionalGenerationConfig", "vllm.model_executor.models.config.Gemma3TextModelConfig", "vllm.model_executor.models.config.GptOssForCausalLMConfig", "vllm.model_executor.models.config.GteNewModelConfig", "vllm.model_executor.models.config.HybridAttentionMambaModelConfig", "vllm.model_executor.models.config.JambaForSequenceClassificationConfig", "vllm.model_executor.models.config.JinaRobertaModelConfig", "vllm.model_executor.models.config.JinaVLForSequenceClassificationConfig", "vllm.model_executor.models.config.LlamaBidirectionalConfig", "vllm.model_executor.models.config.LlamaNemotronVLConfig", "vllm.model_executor.models.config.MODELS_CONFIG_MAP", "vllm.model_executor.models.config.MambaModelConfig", "vllm.model_executor.models.config.NemotronHForCausalLMConfig", "vllm.model_executor.models.config.NomicBertModelConfig", "vllm.model_executor.models.config.Qwen2ForProcessRewardModelConfig", "vllm.model_executor.models.config.Qwen2ForRewardModelConfig", "vllm.model_executor.models.config.Qwen3ForSequenceClassificationConfig", "vllm.model_executor.models.config.Qwen3VLForSequenceClassificationConfig", "vllm.model_executor.models.config.Qwen3_5ForConditionalGenerationConfig", "vllm.model_executor.models.config.SnowflakeGteNewModelConfig", "vllm.model_executor.models.config.VerifyAndUpdateConfig", "vllm.model_executor.models.config.VoyageQwen3BidirectionalEmbedModelConfig", "vllm.model_executor.models.config.logger" ], "n_typable": 46, "n_typed": 45, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 22, "n_method_overloads": 22, "n_method_params": 22, "n_classes": 22, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/dbrx.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.dbrx.DbrxMoE", "methods": [ { "kind": "function", "name": "DbrxMoE.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "DbrxMoE.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DbrxMoE.d_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DbrxMoE.params_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DbrxMoE.router", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DbrxMoE.experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 6, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.dbrx.DbrxFusedNormAttention", "methods": [ { "kind": "function", "name": "DbrxFusedNormAttention.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "DbrxFusedNormAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DbrxFusedNormAttention.d_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DbrxFusedNormAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DbrxFusedNormAttention.norm_1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DbrxFusedNormAttention.norm_2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.dbrx.DbrxAttention", "methods": [ { "kind": "function", "name": "DbrxAttention.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "DbrxAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DbrxAttention.d_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DbrxAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DbrxAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DbrxAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DbrxAttention.clip_qkv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DbrxAttention.max_position", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DbrxAttention.Wqkv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DbrxAttention.out_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DbrxAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DbrxAttention.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DbrxAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DbrxAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DbrxAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DbrxAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DbrxAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DbrxAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 24, "n_typed": 7, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 16, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.dbrx.DbrxExperts", "methods": [ { "kind": "function", "name": "DbrxExperts.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "DbrxExperts.weight_loader", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DbrxExperts.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DbrxExperts.d_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DbrxExperts.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 8, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.dbrx.DbrxRouter", "methods": [ { "kind": "function", "name": "DbrxRouter.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DbrxRouter.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DbrxRouter.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DbrxRouter.num_total_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DbrxRouter.d_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DbrxRouter.layer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 4, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.dbrx.DbrxModel", "methods": [ { "kind": "function", "name": "DbrxModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DbrxModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DbrxModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "DbrxModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DbrxModel.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DbrxModel.wte", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DbrxModel.norm_f", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DbrxModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 11, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.dbrx.DbrxBlock", "methods": [ { "kind": "function", "name": "DbrxBlock.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "DbrxBlock.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DbrxBlock.norm_attn_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DbrxBlock.ffn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 7, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.dbrx.DbrxForCausalLM", "methods": [ { "kind": "function", "name": "DbrxForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DbrxForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DbrxForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "DbrxForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DbrxForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DbrxForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DbrxForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DbrxForCausalLM.transformer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DbrxForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DbrxForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DbrxForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 13, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.dbrx", "names": [ "vllm.model_executor.models.dbrx.DbrxAttention", "vllm.model_executor.models.dbrx.DbrxBlock", "vllm.model_executor.models.dbrx.DbrxExperts", "vllm.model_executor.models.dbrx.DbrxForCausalLM", "vllm.model_executor.models.dbrx.DbrxFusedNormAttention", "vllm.model_executor.models.dbrx.DbrxMoE", "vllm.model_executor.models.dbrx.DbrxModel", "vllm.model_executor.models.dbrx.DbrxRouter" ], "n_typable": 115, "n_typed": 63, "n_any": 0, "n_untyped": 52, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 21, "n_method_overloads": 21, "n_method_params": 51, "n_classes": 8, "n_attrs": 43, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/deepencoder.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.models.deepencoder.build_sam_vit_b", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.model_executor.models.deepencoder.window_unpartition", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.model_executor.models.deepencoder.MLPBlock", "methods": [ { "kind": "function", "name": "MLPBlock.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MLPBlock.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MLPBlock.lin1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLPBlock.lin2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLPBlock.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 6, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 3, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.deepencoder.add_decomposed_rel_pos", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "class", "name": "vllm.model_executor.models.deepencoder.RelPosAttention", "methods": [ { "kind": "function", "name": "RelPosAttention.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "RelPosAttention.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RelPosAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RelPosAttention.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RelPosAttention.qkv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RelPosAttention.proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RelPosAttention.use_rel_pos", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RelPosAttention.rel_pos_h", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RelPosAttention.rel_pos_w", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 9, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.deepencoder.DeepCLIPVisionEmbeddings", "methods": [ { "kind": "function", "name": "DeepCLIPVisionEmbeddings.get_abs_pos", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeepCLIPVisionEmbeddings.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.deepencoder.LayerNorm2d", "methods": [ { "kind": "function", "name": "LayerNorm2d.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LayerNorm2d.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LayerNorm2d.weight", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LayerNorm2d.bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LayerNorm2d.eps", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 5, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.deepencoder.DeepCLIPVisionTransformer", "methods": [ { "kind": "function", "name": "DeepCLIPVisionTransformer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "DeepCLIPVisionTransformer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DeepCLIPVisionTransformer.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "DeepCLIPVisionTransformer.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "DeepCLIPVisionTransformer.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "DeepCLIPVisionTransformer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepCLIPVisionTransformer.embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepCLIPVisionTransformer.pre_layrnorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepCLIPVisionTransformer.transformer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 11, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 8, "n_attrs": 4, "n_properties": 2 }, { "kind": "class", "name": "vllm.model_executor.models.deepencoder.ImageEncoderViT", "methods": [ { "kind": "function", "name": "ImageEncoderViT.__init__", "n_typed": 18, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 18, "n_params": 17, "n_function_overloads": 1, "n_function_params": 17 }, { "kind": "function", "name": "ImageEncoderViT.get_abs_pos", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ImageEncoderViT.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ImageEncoderViT.img_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ImageEncoderViT.patch_embed", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ImageEncoderViT.pos_embed", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ImageEncoderViT.blocks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ImageEncoderViT.neck", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ImageEncoderViT.net_2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ImageEncoderViT.net_3", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 30, "n_typed": 23, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 20, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.deepencoder.Block", "methods": [ { "kind": "function", "name": "Block.__init__", "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "Block.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Block.norm1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Block.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Block.norm2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Block.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Block.window_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 13, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 11, "n_attrs": 5, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.deepencoder.window_partition", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.models.deepencoder.PatchEmbed", "methods": [ { "kind": "function", "name": "PatchEmbed.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "PatchEmbed.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PatchEmbed.proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.deepencoder.get_rel_pos", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [], "name": "vllm.model_executor.models.deepencoder", "names": [ "vllm.model_executor.models.deepencoder.Block", "vllm.model_executor.models.deepencoder.DeepCLIPVisionEmbeddings", "vllm.model_executor.models.deepencoder.DeepCLIPVisionTransformer", "vllm.model_executor.models.deepencoder.ImageEncoderViT", "vllm.model_executor.models.deepencoder.LayerNorm2d", "vllm.model_executor.models.deepencoder.MLPBlock", "vllm.model_executor.models.deepencoder.PatchEmbed", "vllm.model_executor.models.deepencoder.RelPosAttention", "vllm.model_executor.models.deepencoder.add_decomposed_rel_pos", "vllm.model_executor.models.deepencoder.build_sam_vit_b", "vllm.model_executor.models.deepencoder.get_rel_pos", "vllm.model_executor.models.deepencoder.window_partition", "vllm.model_executor.models.deepencoder.window_unpartition" ], "n_typable": 132, "n_typed": 98, "n_any": 0, "n_untyped": 34, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 14, "n_methods": 18, "n_method_overloads": 18, "n_method_params": 63, "n_classes": 8, "n_attrs": 30, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/deepencoder2.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.deepencoder2.Qwen2Decoder2Encoder", "methods": [ { "kind": "function", "name": "Qwen2Decoder2Encoder.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Qwen2Decoder2Encoder.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen2Decoder2Encoder.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2Decoder2Encoder.query_768", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2Decoder2Encoder.query_1024", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 7, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 3, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.deepencoder2.build_qwen2_decoder_as_encoder", "n_typed": 0, "n_any": 0, "n_untyped": 6, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "class", "name": "vllm.model_executor.models.deepencoder2.CustomQwen2Decoder", "methods": [ { "kind": "function", "name": "CustomQwen2Decoder.__init__", "n_typed": 13, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 }, { "kind": "function", "name": "CustomQwen2Decoder._create_custom_model", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CustomQwen2Decoder.forward", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CustomQwen2Decoder.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 23, "n_typed": 16, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 19, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.deepencoder2", "names": [ "vllm.model_executor.models.deepencoder2.CustomQwen2Decoder", "vllm.model_executor.models.deepencoder2.Qwen2Decoder2Encoder", "vllm.model_executor.models.deepencoder2.build_qwen2_decoder_as_encoder" ], "n_typable": 40, "n_typed": 23, "n_any": 0, "n_untyped": 17, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 5, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 25, "n_classes": 2, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/deepseek_eagle.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.deepseek_eagle.EagleDeepseekV3ForCausalLM", "methods": [ { "kind": "function", "name": "EagleDeepseekV3ForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EagleDeepseekV3ForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EagleDeepseekV3ForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "EagleDeepseekV3ForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EagleDeepseekV3ForCausalLM.load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EagleDeepseekV3ForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleDeepseekV3ForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleDeepseekV3ForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleDeepseekV3ForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleDeepseekV3ForCausalLM.num_moe_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 12, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.deepseek_eagle.DeepseekV2Model", "methods": [ { "kind": "function", "name": "DeepseekV2Model.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DeepseekV2Model.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepseekV2Model.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DeepseekV2Model.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DeepseekV2Model.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2Model.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2Model.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2Model.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2Model.fc", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2Model.enorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2Model.hnorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2Model.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 12, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 8, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.deepseek_eagle", "names": [ "vllm.model_executor.models.deepseek_eagle.DeepseekV2Model", "vllm.model_executor.models.deepseek_eagle.EagleDeepseekV3ForCausalLM" ], "n_typable": 39, "n_typed": 24, "n_any": 0, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 17, "n_classes": 2, "n_attrs": 13, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/deepseek_mtp.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.deepseek_mtp.DeepSeekMultiTokenPredictor", "methods": [ { "kind": "function", "name": "DeepSeekMultiTokenPredictor.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeepSeekMultiTokenPredictor.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepSeekMultiTokenPredictor.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "DeepSeekMultiTokenPredictor.compute_logits", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DeepSeekMultiTokenPredictor.mtp_start_layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekMultiTokenPredictor.num_mtp_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekMultiTokenPredictor.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekMultiTokenPredictor.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekMultiTokenPredictor.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 13, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 10, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.deepseek_mtp.SharedHead", "methods": [ { "kind": "function", "name": "SharedHead.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SharedHead.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SharedHead.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SharedHead.head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.deepseek_mtp.DeepSeekMultiTokenPredictorLayer", "methods": [ { "kind": "function", "name": "DeepSeekMultiTokenPredictorLayer.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeepSeekMultiTokenPredictorLayer.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DeepSeekMultiTokenPredictorLayer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekMultiTokenPredictorLayer.enorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekMultiTokenPredictorLayer.hnorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekMultiTokenPredictorLayer.eh_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekMultiTokenPredictorLayer.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekMultiTokenPredictorLayer.is_v32", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekMultiTokenPredictorLayer.shared_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekMultiTokenPredictorLayer.mtp_block", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 9, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 8, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.deepseek_mtp.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.deepseek_mtp.DeepSeekMTP", "methods": [ { "kind": "function", "name": "DeepSeekMTP.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeepSeekMTP.set_moe_parameters", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeepSeekMTP.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepSeekMTP.forward", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "DeepSeekMTP.compute_logits", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeepSeekMTP.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepSeekMTP._rewrite_spec_layer_name", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DeepSeekMTP.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekMTP.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 23, "n_typed": 19, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 14, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.deepseek_mtp", "names": [ "vllm.model_executor.models.deepseek_mtp.DeepSeekMTP", "vllm.model_executor.models.deepseek_mtp.DeepSeekMultiTokenPredictor", "vllm.model_executor.models.deepseek_mtp.DeepSeekMultiTokenPredictorLayer", "vllm.model_executor.models.deepseek_mtp.SharedHead", "vllm.model_executor.models.deepseek_mtp.logger" ], "n_typable": 68, "n_typed": 47, "n_any": 0, "n_untyped": 21, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 35, "n_classes": 4, "n_attrs": 18, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/deepseek_ocr.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.deepseek_ocr.DeepseekOCRProcessingInfo", "methods": [ { "kind": "function", "name": "DeepseekOCRProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeepseekOCRProcessingInfo.get_hf_processor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepseekOCRProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeepseekOCRProcessingInfo.get_num_image_tokens", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DeepseekOCRProcessingInfo.get_image_size_with_most_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 7, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.deepseek_ocr.DeepseekOCRImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "DeepseekOCRImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCRImagePixelInputs.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCRImagePixelInputs.images_crop", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCRImagePixelInputs.images_spatial_crop", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.deepseek_ocr.DeepseekOCRForCausalLM", "methods": [ { "kind": "function", "name": "DeepseekOCRForCausalLM.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeepseekOCRForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeepseekOCRForCausalLM._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepseekOCRForCausalLM._encode_global_features", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepseekOCRForCausalLM._encode_local_features", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeepseekOCRForCausalLM._pixel_values_to_embedding", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DeepseekOCRForCausalLM._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepseekOCRForCausalLM.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepseekOCRForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "DeepseekOCRForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepseekOCRForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepseekOCRForCausalLM.get_mm_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DeepseekOCRForCausalLM.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCRForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCRForCausalLM.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCRForCausalLM.vision_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCRForCausalLM.projector_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCRForCausalLM.text_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCRForCausalLM.image_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCRForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCRForCausalLM.sam_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCRForCausalLM.vision_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCRForCausalLM.projector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCRForCausalLM.tile_tag", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCRForCausalLM.global_view_pos", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCRForCausalLM.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCRForCausalLM.image_newline", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCRForCausalLM.view_seperator", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 48, "n_typed": 30, "n_any": 0, "n_untyped": 18, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 20, "n_attrs": 16, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.deepseek_ocr.NGramPerReqLogitsProcessor", "methods": [ { "kind": "function", "name": "NGramPerReqLogitsProcessor.validate_params", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NGramPerReqLogitsProcessor.is_argmax_invariant", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NGramPerReqLogitsProcessor.new_req_logits_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 5, "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.deepseek_ocr.NoRepeatNGramLogitsProcessor", "methods": [ { "kind": "function", "name": "NoRepeatNGramLogitsProcessor.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "NoRepeatNGramLogitsProcessor.__call__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "NoRepeatNGramLogitsProcessor.ngram_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NoRepeatNGramLogitsProcessor.window_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NoRepeatNGramLogitsProcessor.whitelist_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 6, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.deepseek_ocr.DeepseekOCRDummyInputsBuilder", "methods": [ { "kind": "function", "name": "DeepseekOCRDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepseekOCRDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.deepseek_ocr.DeepseekOCRMultiModalProcessor", "methods": [ { "kind": "function", "name": "DeepseekOCRMultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "DeepseekOCRMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeepseekOCRMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.deepseek_ocr.IMAGE_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.deepseek_ocr", "names": [ "vllm.model_executor.models.deepseek_ocr.DeepseekOCRDummyInputsBuilder", "vllm.model_executor.models.deepseek_ocr.DeepseekOCRForCausalLM", "vllm.model_executor.models.deepseek_ocr.DeepseekOCRImagePixelInputs", "vllm.model_executor.models.deepseek_ocr.DeepseekOCRMultiModalProcessor", "vllm.model_executor.models.deepseek_ocr.DeepseekOCRProcessingInfo", "vllm.model_executor.models.deepseek_ocr.IMAGE_SIZE", "vllm.model_executor.models.deepseek_ocr.NGramPerReqLogitsProcessor", "vllm.model_executor.models.deepseek_ocr.NoRepeatNGramLogitsProcessor" ], "n_typable": 94, "n_typed": 69, "n_any": 0, "n_untyped": 25, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 27, "n_method_overloads": 27, "n_method_params": 44, "n_classes": 7, "n_attrs": 24, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/deepseek_ocr2.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.deepseek_ocr2.DeepseekOCR2ForCausalLM", "methods": [ { "kind": "function", "name": "DeepseekOCR2ForCausalLM.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeepseekOCR2ForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeepseekOCR2ForCausalLM._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepseekOCR2ForCausalLM._encode_global_features", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepseekOCR2ForCausalLM._encode_local_features", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepseekOCR2ForCausalLM._pixel_values_to_embedding", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DeepseekOCR2ForCausalLM._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepseekOCR2ForCausalLM.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepseekOCR2ForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "DeepseekOCR2ForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepseekOCR2ForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepseekOCR2ForCausalLM.get_mm_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DeepseekOCR2ForCausalLM.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCR2ForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCR2ForCausalLM.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCR2ForCausalLM.vision_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCR2ForCausalLM.projector_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCR2ForCausalLM.text_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCR2ForCausalLM.image_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCR2ForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCR2ForCausalLM.sam_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCR2ForCausalLM.qwen2_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCR2ForCausalLM.projector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCR2ForCausalLM.tile_tag", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCR2ForCausalLM.global_view_pos", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCR2ForCausalLM.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCR2ForCausalLM.view_seperator", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 46, "n_typed": 29, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 19, "n_attrs": 15, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.deepseek_ocr2.DeepseekOCR2DummyInputsBuilder", "methods": [ { "kind": "function", "name": "DeepseekOCR2DummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepseekOCR2DummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.deepseek_ocr2.DeepseekOCR2ProcessingInfo", "methods": [ { "kind": "function", "name": "DeepseekOCR2ProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeepseekOCR2ProcessingInfo.get_hf_processor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepseekOCR2ProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeepseekOCR2ProcessingInfo.get_num_image_tokens", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DeepseekOCR2ProcessingInfo.get_image_size_with_most_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 7, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.deepseek_ocr2.DeepseekOCR2MultiModalProcessor", "methods": [ { "kind": "function", "name": "DeepseekOCR2MultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "DeepseekOCR2MultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeepseekOCR2MultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.deepseek_ocr2.IMAGE_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.deepseek_ocr2", "names": [ "vllm.model_executor.models.deepseek_ocr2.DeepseekOCR2DummyInputsBuilder", "vllm.model_executor.models.deepseek_ocr2.DeepseekOCR2ForCausalLM", "vllm.model_executor.models.deepseek_ocr2.DeepseekOCR2MultiModalProcessor", "vllm.model_executor.models.deepseek_ocr2.DeepseekOCR2ProcessingInfo", "vllm.model_executor.models.deepseek_ocr2.IMAGE_SIZE" ], "n_typable": 73, "n_typed": 54, "n_any": 0, "n_untyped": 19, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 22, "n_method_overloads": 22, "n_method_params": 36, "n_classes": 4, "n_attrs": 16, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/deepseek_v2.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.deepseek_v2.DeepseekAttention", "methods": [ { "kind": "function", "name": "DeepseekAttention.__init__", "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "DeepseekAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DeepseekAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekAttention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 27, "n_typed": 12, "n_any": 0, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 11, "n_attrs": 14, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.deepseek_v2.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.deepseek_v2.DeepseekV32IndexerCache", "methods": [ { "kind": "function", "name": "DeepseekV32IndexerCache.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "DeepseekV32IndexerCache.get_kv_cache_spec", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepseekV32IndexerCache.forward", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeepseekV32IndexerCache.get_attn_backend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DeepseekV32IndexerCache.kv_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV32IndexerCache.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV32IndexerCache.prefix", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV32IndexerCache.cache_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV32IndexerCache.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 7, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 5, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.deepseek_v2.DeepseekV2DecoderLayer", "methods": [ { "kind": "function", "name": "DeepseekV2DecoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "DeepseekV2DecoderLayer.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DeepseekV2DecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2DecoderLayer.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2DecoderLayer.use_mha", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2DecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2DecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2DecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2DecoderLayer.routed_scaling_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2DecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 10, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 8, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.deepseek_v2.get_spec_layer_idx_from_weight_name", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.models.deepseek_v2.DeepseekV2MLAAttention", "methods": [ { "kind": "function", "name": "DeepseekV2MLAAttention.__init__", "n_typed": 15, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 15, "n_params": 14, "n_function_overloads": 1, "n_function_params": 14 }, { "kind": "function", "name": "DeepseekV2MLAAttention.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DeepseekV2MLAAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MLAAttention.qk_nope_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MLAAttention.qk_rope_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MLAAttention.qk_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MLAAttention.v_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MLAAttention.q_lora_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MLAAttention.kv_lora_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MLAAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MLAAttention.num_local_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MLAAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MLAAttention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MLAAttention.kv_a_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MLAAttention.kv_b_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MLAAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MLAAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MLAAttention.is_v32", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MLAAttention.mla_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MLAAttention.fused_qkv_a_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MLAAttention.q_a_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MLAAttention.q_b_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MLAAttention.indexer_rope_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MLAAttention.indexer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MLAAttention.kv_a_proj_with_mqa", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MLAAttention.q_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 43, "n_typed": 19, "n_any": 0, "n_untyped": 24, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 17, "n_attrs": 24, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.deepseek_v2.DeepSeekV2FusedQkvAProj", "methods": [ { "kind": "function", "name": "DeepSeekV2FusedQkvAProj.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "DeepSeekV2FusedQkvAProj.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.deepseek_v2.DeepseekV2MLP", "methods": [ { "kind": "function", "name": "DeepseekV2MLP.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "DeepseekV2MLP.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DeepseekV2MLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 7, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.deepseek_v2.DeepseekV2Model", "methods": [ { "kind": "function", "name": "DeepseekV2Model.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeepseekV2Model.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepseekV2Model.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DeepseekV2Model.fall_back_to_pt_during_load", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeepseekV2Model.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2Model.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2Model.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2Model.is_v32", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2Model.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2Model.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2Model.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 9, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.deepseek_v2.DeepseekV2ForCausalLM", "methods": [ { "kind": "function", "name": "DeepseekV2ForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeepseekV2ForCausalLM.set_moe_parameters", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeepseekV2ForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepseekV2ForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "DeepseekV2ForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepseekV2ForCausalLM.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeepseekV2ForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DeepseekV2ForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeepseekV2ForCausalLM.model_cls", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeepseekV2ForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2ForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2ForCausalLM.use_mha", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2ForCausalLM.fuse_qkv_a_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2ForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2ForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2ForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2ForCausalLM.num_moe_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2ForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 25, "n_typed": 14, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 9, "n_attrs": 11, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.deepseek_v2.DeepseekV2MoE", "methods": [ { "kind": "function", "name": "DeepseekV2MoE.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "DeepseekV2MoE.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DeepseekV2MoE.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MoE.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MoE.routed_scaling_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MoE.ep_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MoE.ep_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MoE.ep_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MoE.n_routed_experts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MoE.n_shared_experts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MoE.is_sequence_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MoE.gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MoE.enable_eplb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MoE.n_redundant_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MoE.n_logical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MoE.n_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MoE.n_local_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MoE.physical_expert_start", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MoE.physical_expert_end", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MoE.is_rocm_aiter_moe_enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MoE.is_fusion_moe_shared_experts_enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MoE.experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2MoE.shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 28, "n_typed": 8, "n_any": 0, "n_untyped": 20, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 21, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.deepseek_v2.DeepseekV2Attention", "methods": [ { "kind": "function", "name": "DeepseekV2Attention.__init__", "n_typed": 15, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 15, "n_params": 14, "n_function_overloads": 1, "n_function_params": 14 }, { "kind": "function", "name": "DeepseekV2Attention.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DeepseekV2Attention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2Attention.qk_nope_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2Attention.qk_rope_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2Attention.qk_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2Attention.v_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2Attention.q_lora_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2Attention.kv_lora_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2Attention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2Attention.num_local_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2Attention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2Attention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2Attention.kv_a_proj_with_mqa", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2Attention.kv_a_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2Attention.kv_b_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2Attention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2Attention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2Attention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2Attention.q_a_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2Attention.q_a_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2Attention.q_b_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV2Attention.q_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 40, "n_typed": 19, "n_any": 0, "n_untyped": 21, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 17, "n_attrs": 21, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.deepseek_v2.DeepseekForCausalLM", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.deepseek_v2.Indexer", "methods": [ { "kind": "function", "name": "Indexer.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "Indexer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Indexer.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Indexer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Indexer.topk_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Indexer.n_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Indexer.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Indexer.rope_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Indexer.q_lora_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Indexer.wq_b", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Indexer.wk", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Indexer.k_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Indexer.weights_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Indexer.softmax_scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Indexer.scale_fmt", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Indexer.quant_block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Indexer.topk_indices_buffer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Indexer.k_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Indexer.max_model_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Indexer.prefix", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Indexer.max_total_seq_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Indexer.indexer_op", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 34, "n_typed": 11, "n_any": 0, "n_untyped": 23, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 12, "n_attrs": 20, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.deepseek_v2.DeepseekV2MixtureOfExperts", "methods": [ { "kind": "function", "name": "DeepseekV2MixtureOfExperts.extract_moe_parameters", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepseekV2MixtureOfExperts.update_physical_experts_metadata", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DeepseekV2MixtureOfExperts.moe_mlp_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 6, "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.deepseek_v2.yarn_get_mscale", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.models.deepseek_v2.DeepseekV3ForCausalLM", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.deepseek_v2.GlmMoeDsaForCausalLM", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.deepseek_v2", "names": [ "vllm.model_executor.models.deepseek_v2.DeepSeekV2FusedQkvAProj", "vllm.model_executor.models.deepseek_v2.DeepseekAttention", "vllm.model_executor.models.deepseek_v2.DeepseekForCausalLM", "vllm.model_executor.models.deepseek_v2.DeepseekV2Attention", "vllm.model_executor.models.deepseek_v2.DeepseekV2DecoderLayer", "vllm.model_executor.models.deepseek_v2.DeepseekV2ForCausalLM", "vllm.model_executor.models.deepseek_v2.DeepseekV2MLAAttention", "vllm.model_executor.models.deepseek_v2.DeepseekV2MLP", "vllm.model_executor.models.deepseek_v2.DeepseekV2MixtureOfExperts", "vllm.model_executor.models.deepseek_v2.DeepseekV2MoE", "vllm.model_executor.models.deepseek_v2.DeepseekV2Model", "vllm.model_executor.models.deepseek_v2.DeepseekV32IndexerCache", "vllm.model_executor.models.deepseek_v2.DeepseekV3ForCausalLM", "vllm.model_executor.models.deepseek_v2.GlmMoeDsaForCausalLM", "vllm.model_executor.models.deepseek_v2.Indexer", "vllm.model_executor.models.deepseek_v2.get_spec_layer_idx_from_weight_name", "vllm.model_executor.models.deepseek_v2.logger", "vllm.model_executor.models.deepseek_v2.yarn_get_mscale" ], "n_typable": 279, "n_typed": 132, "n_any": 0, "n_untyped": 147, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 4, "n_methods": 32, "n_method_overloads": 32, "n_method_params": 107, "n_classes": 15, "n_attrs": 137, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/deepseek_vl2.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.deepseek_vl2.MlpProjector", "methods": [ { "kind": "function", "name": "MlpProjector.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MlpProjector.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MlpProjector.cfg", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MlpProjector.projector_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MlpProjector.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 1, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.deepseek_vl2.DeepseekVL2ImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "DeepseekVL2ImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekVL2ImagePixelInputs.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekVL2ImagePixelInputs.images_spatial_crop", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.deepseek_vl2.DeepseekVL2MultiModalProcessor", "methods": [ { "kind": "function", "name": "DeepseekVL2MultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "DeepseekVL2MultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeepseekVL2MultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DeepseekVL2MultiModalProcessor._cached_apply_hf_processor", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 15, "n_typed": 15, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 11, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.deepseek_vl2.DeepseekVL2ImageInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.deepseek_vl2.DeepseekVL2VImageEmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "DeepseekVL2VImageEmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekVL2VImageEmbeddingInputs.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.deepseek_vl2.DeepseekVL2DummyInputsBuilder", "methods": [ { "kind": "function", "name": "DeepseekVL2DummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepseekVL2DummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.deepseek_vl2.DeepseekVLV2ForCausalLM", "methods": [ { "kind": "function", "name": "DeepseekVLV2ForCausalLM.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeepseekVLV2ForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeepseekVLV2ForCausalLM._get_parent_and_attr", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeepseekVLV2ForCausalLM.patch_vit_for_tp", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeepseekVLV2ForCausalLM._init_vision_module", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DeepseekVLV2ForCausalLM._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepseekVLV2ForCausalLM._pixel_values_to_embedding", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeepseekVLV2ForCausalLM._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepseekVLV2ForCausalLM.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepseekVLV2ForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "DeepseekVLV2ForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepseekVLV2ForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DeepseekVLV2ForCausalLM.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekVLV2ForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekVLV2ForCausalLM.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekVLV2ForCausalLM.vision_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekVLV2ForCausalLM.projector_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekVLV2ForCausalLM.text_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekVLV2ForCausalLM.image_token_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekVLV2ForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekVLV2ForCausalLM.vision", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekVLV2ForCausalLM.projector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekVLV2ForCausalLM.tile_tag", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekVLV2ForCausalLM.global_view_pos", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekVLV2ForCausalLM.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekVLV2ForCausalLM.image_newline", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekVLV2ForCausalLM.view_seperator", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 50, "n_typed": 32, "n_any": 0, "n_untyped": 18, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 23, "n_attrs": 15, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.deepseek_vl2.DeepseekVL2ProcessingInfo", "methods": [ { "kind": "function", "name": "DeepseekVL2ProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeepseekVL2ProcessingInfo.get_hf_processor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepseekVL2ProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeepseekVL2ProcessingInfo.get_num_image_tokens", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DeepseekVL2ProcessingInfo.get_image_size_with_most_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 7, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.deepseek_vl2", "names": [ "vllm.model_executor.models.deepseek_vl2.DeepseekVL2DummyInputsBuilder", "vllm.model_executor.models.deepseek_vl2.DeepseekVL2ImageInputs", "vllm.model_executor.models.deepseek_vl2.DeepseekVL2ImagePixelInputs", "vllm.model_executor.models.deepseek_vl2.DeepseekVL2MultiModalProcessor", "vllm.model_executor.models.deepseek_vl2.DeepseekVL2ProcessingInfo", "vllm.model_executor.models.deepseek_vl2.DeepseekVL2VImageEmbeddingInputs", "vllm.model_executor.models.deepseek_vl2.DeepseekVLV2ForCausalLM", "vllm.model_executor.models.deepseek_vl2.MlpProjector" ], "n_typable": 93, "n_typed": 67, "n_any": 0, "n_untyped": 26, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 25, "n_method_overloads": 25, "n_method_params": 44, "n_classes": 7, "n_attrs": 24, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/dots1.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.dots1.Dots1Model", "methods": [ { "kind": "function", "name": "Dots1Model.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Dots1Model.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Dots1Model.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Dots1Model.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Dots1Model.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Dots1Model.fall_back_to_pt_during_load", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Dots1Model.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Dots1Model.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Dots1Model.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Dots1Model.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Dots1Model.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 12, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 8, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.dots1.Dots1Attention", "methods": [ { "kind": "function", "name": "Dots1Attention.__init__", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "Dots1Attention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Dots1Attention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Dots1Attention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Dots1Attention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Dots1Attention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Dots1Attention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Dots1Attention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Dots1Attention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Dots1Attention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Dots1Attention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Dots1Attention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Dots1Attention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Dots1Attention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Dots1Attention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Dots1Attention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Dots1Attention.q_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Dots1Attention.k_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 28, "n_typed": 12, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 10, "n_attrs": 16, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.dots1.Dots1MoE", "methods": [ { "kind": "function", "name": "Dots1MoE.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Dots1MoE.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Dots1MoE.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Dots1MoE.routed_scaling_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Dots1MoE.n_shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Dots1MoE.gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Dots1MoE.experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Dots1MoE.shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 5, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.dots1.Dots1ForCausalLM", "methods": [ { "kind": "function", "name": "Dots1ForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Dots1ForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Dots1ForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Dots1ForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Dots1ForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Dots1ForCausalLM.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Dots1ForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Dots1ForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Dots1ForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Dots1ForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Dots1ForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Dots1ForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Dots1ForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 14, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 9, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.dots1.Dots1DecoderLayer", "methods": [ { "kind": "function", "name": "Dots1DecoderLayer.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Dots1DecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Dots1DecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Dots1DecoderLayer.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Dots1DecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Dots1DecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Dots1DecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Dots1DecoderLayer.routed_scaling_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Dots1DecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 10, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.dots1.Dots1MLP", "methods": [ { "kind": "function", "name": "Dots1MLP.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Dots1MLP.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Dots1MLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Dots1MLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Dots1MLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.dots1", "names": [ "vllm.model_executor.models.dots1.Dots1Attention", "vllm.model_executor.models.dots1.Dots1DecoderLayer", "vllm.model_executor.models.dots1.Dots1ForCausalLM", "vllm.model_executor.models.dots1.Dots1MLP", "vllm.model_executor.models.dots1.Dots1MoE", "vllm.model_executor.models.dots1.Dots1Model" ], "n_typable": 108, "n_typed": 60, "n_any": 0, "n_untyped": 48, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 19, "n_method_overloads": 19, "n_method_params": 46, "n_classes": 6, "n_attrs": 45, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/dots_ocr.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.dots_ocr.DotsVisionTransformer", "methods": [ { "kind": "function", "name": "DotsVisionTransformer.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "DotsVisionTransformer.get_pos_ids_by_grid", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DotsVisionTransformer.rot_pos_emb", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DotsVisionTransformer.compute_attn_mask_seqlen", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DotsVisionTransformer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [ { "kind": "property", "name": "DotsVisionTransformer.dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "DotsVisionTransformer.device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "DotsVisionTransformer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsVisionTransformer.spatial_merge_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsVisionTransformer.patch_embed", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsVisionTransformer.rotary_pos_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsVisionTransformer.attn_backend", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsVisionTransformer.out_hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsVisionTransformer.blocks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsVisionTransformer.merger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsVisionTransformer.post_trunk_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 26, "n_typed": 17, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 10, "n_attrs": 9, "n_properties": 2 }, { "kind": "class", "name": "vllm.model_executor.models.dots_ocr.DotsVisionBlock", "methods": [ { "kind": "function", "name": "DotsVisionBlock.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DotsVisionBlock.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DotsVisionBlock.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsVisionBlock.norm1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsVisionBlock.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsVisionBlock.norm2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 7, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.dots_ocr.DotsOCRImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "DotsOCRImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DotsOCRImagePixelInputs.pixel_values", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DotsOCRImagePixelInputs.image_grid_thw", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.dots_ocr.PatchMerger", "methods": [ { "kind": "function", "name": "PatchMerger.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "PatchMerger.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PatchMerger.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PatchMerger.pre_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PatchMerger.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PatchMerger.ln_q", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.dots_ocr.DotsOCRForCausalLM", "methods": [ { "kind": "function", "name": "DotsOCRForCausalLM.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DotsOCRForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DotsOCRForCausalLM._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DotsOCRForCausalLM._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DotsOCRForCausalLM.get_num_mm_encoder_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DotsOCRForCausalLM.get_num_mm_connector_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DotsOCRForCausalLM.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DotsOCRForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "DotsOCRForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DotsOCRForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DotsOCRForCausalLM.get_mm_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DotsOCRForCausalLM.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsOCRForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DotsOCRForCausalLM.supports_encoder_tp_data", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DotsOCRForCausalLM.config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DotsOCRForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsOCRForCausalLM.use_data_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsOCRForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsOCRForCausalLM.vision_tower", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsOCRForCausalLM.language_model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 34, "n_typed": 27, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 16, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.dots_ocr.DotsPatchEmbed", "methods": [ { "kind": "function", "name": "DotsPatchEmbed.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DotsPatchEmbed.forward", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DotsPatchEmbed.num_channels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsPatchEmbed.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsPatchEmbed.temporal_patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsPatchEmbed.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsPatchEmbed.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsPatchEmbed.proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsPatchEmbed.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 2, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 7, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.dots_ocr.DotsOCRImageInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.dots_ocr.DotsSwiGLUFFN", "methods": [ { "kind": "function", "name": "DotsSwiGLUFFN.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DotsSwiGLUFFN.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DotsSwiGLUFFN.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DotsSwiGLUFFN.fc13", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsSwiGLUFFN.fc2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsSwiGLUFFN.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 6, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 5, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.dots_ocr.DotsOCRProcessingInfo", "methods": [ { "kind": "function", "name": "DotsOCRProcessingInfo.get_hf_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DotsOCRProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DotsOCRProcessingInfo.get_mm_max_tokens_per_item", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DotsOCRProcessingInfo.get_hf_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.dots_ocr.IMAGE_TOKEN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.dots_ocr.DotsOCRImageEmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "DotsOCRImageEmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DotsOCRImageEmbeddingInputs.image_embeds", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DotsOCRImageEmbeddingInputs.image_grid_thw", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.dots_ocr.DotsOCRDummyInputsBuilder", "methods": [ { "kind": "function", "name": "DotsOCRDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DotsOCRDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.dots_ocr.VisionRotaryEmbedding", "methods": [ { "kind": "function", "name": "VisionRotaryEmbedding.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VisionRotaryEmbedding.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.dots_ocr.DotsViTPreprocessor", "methods": [ { "kind": "function", "name": "DotsViTPreprocessor.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DotsViTPreprocessor.forward", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DotsViTPreprocessor.patch_h", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsViTPreprocessor.patch_w", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsViTPreprocessor.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsViTPreprocessor.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsViTPreprocessor.patchifier", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 2, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.dots_ocr.DotsVisionAttention", "methods": [ { "kind": "function", "name": "DotsVisionAttention.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "DotsVisionAttention.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DotsVisionAttention.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsVisionAttention.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsVisionAttention.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsVisionAttention.hidden_size_per_attention_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsVisionAttention.num_attention_heads_per_partition", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsVisionAttention.qkv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsVisionAttention.proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsVisionAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsVisionAttention.apply_rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 11, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 10, "n_attrs": 9, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.dots_ocr", "names": [ "vllm.model_executor.models.dots_ocr.DotsOCRDummyInputsBuilder", "vllm.model_executor.models.dots_ocr.DotsOCRForCausalLM", "vllm.model_executor.models.dots_ocr.DotsOCRImageEmbeddingInputs", "vllm.model_executor.models.dots_ocr.DotsOCRImageInputs", "vllm.model_executor.models.dots_ocr.DotsOCRImagePixelInputs", "vllm.model_executor.models.dots_ocr.DotsOCRProcessingInfo", "vllm.model_executor.models.dots_ocr.DotsPatchEmbed", "vllm.model_executor.models.dots_ocr.DotsSwiGLUFFN", "vllm.model_executor.models.dots_ocr.DotsViTPreprocessor", "vllm.model_executor.models.dots_ocr.DotsVisionAttention", "vllm.model_executor.models.dots_ocr.DotsVisionBlock", "vllm.model_executor.models.dots_ocr.DotsVisionTransformer", "vllm.model_executor.models.dots_ocr.IMAGE_TOKEN", "vllm.model_executor.models.dots_ocr.PatchMerger", "vllm.model_executor.models.dots_ocr.VisionRotaryEmbedding" ], "n_typable": 164, "n_typed": 104, "n_any": 0, "n_untyped": 60, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 37, "n_method_overloads": 37, "n_method_params": 70, "n_classes": 13, "n_attrs": 58, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/eagle2_5_vl.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.eagle2_5_vl.Eagle2_5_VLProcessingInfo", "methods": [ { "kind": "function", "name": "Eagle2_5_VLProcessingInfo.get_hf_processor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.eagle2_5_vl.Eagle2_5_VLImageInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.eagle2_5_vl.Eagle2_5_VLProcessor", "methods": [ { "kind": "function", "name": "Eagle2_5_VLProcessor.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Eagle2_5_VLProcessor.get_image_repl", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [ { "kind": "property", "name": "Eagle2_5_VLProcessor.image_token_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "Eagle2_5_VLProcessor.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Eagle2_5_VLProcessor.tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Eagle2_5_VLProcessor.num_image_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Eagle2_5_VLProcessor.image_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Eagle2_5_VLProcessor.min_dynamic_patch", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Eagle2_5_VLProcessor.max_dynamic_patch", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Eagle2_5_VLProcessor.dynamic_image_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Eagle2_5_VLProcessor.use_thumbnail", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 18, "n_typed": 11, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 8, "n_properties": 1 }, { "kind": "class", "name": "vllm.model_executor.models.eagle2_5_vl.Eagle2_5_VLImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Eagle2_5_VLImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Eagle2_5_VLImagePixelInputs.pixel_values_flat", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Eagle2_5_VLImagePixelInputs.num_patches", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.eagle2_5_vl.Eagle2_5_VLDummyInputsBuilder", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.eagle2_5_vl.Eagle2_5_VLMultiModalProcessor", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.eagle2_5_vl.Eagle2_5_VLImageEmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Eagle2_5_VLImageEmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Eagle2_5_VLImageEmbeddingInputs.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.eagle2_5_vl.Eagle2_5_VLForConditionalGeneration", "methods": [ { "kind": "function", "name": "Eagle2_5_VLForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Eagle2_5_VLForConditionalGeneration.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Eagle2_5_VLForConditionalGeneration._init_vision_model", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Eagle2_5_VLForConditionalGeneration._init_mlp1", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Eagle2_5_VLForConditionalGeneration.pixel_shuffle", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Eagle2_5_VLForConditionalGeneration.extract_feature", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Eagle2_5_VLForConditionalGeneration._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Eagle2_5_VLForConditionalGeneration._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Eagle2_5_VLForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Eagle2_5_VLForConditionalGeneration.embed_input_ids", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Eagle2_5_VLForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Eagle2_5_VLForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Eagle2_5_VLForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Eagle2_5_VLForConditionalGeneration.get_mm_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Eagle2_5_VLForConditionalGeneration.supports_encoder_tp_data", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Eagle2_5_VLForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Eagle2_5_VLForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Eagle2_5_VLForConditionalGeneration.use_data_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Eagle2_5_VLForConditionalGeneration.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Eagle2_5_VLForConditionalGeneration.downsample_ratio", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Eagle2_5_VLForConditionalGeneration.num_image_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Eagle2_5_VLForConditionalGeneration.select_layer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Eagle2_5_VLForConditionalGeneration.img_context_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Eagle2_5_VLForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Eagle2_5_VLForConditionalGeneration.vision_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Eagle2_5_VLForConditionalGeneration.mlp1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Eagle2_5_VLForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 51, "n_typed": 38, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 25, "n_attrs": 13, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.eagle2_5_vl", "names": [ "vllm.model_executor.models.eagle2_5_vl.Eagle2_5_VLDummyInputsBuilder", "vllm.model_executor.models.eagle2_5_vl.Eagle2_5_VLForConditionalGeneration", "vllm.model_executor.models.eagle2_5_vl.Eagle2_5_VLImageEmbeddingInputs", "vllm.model_executor.models.eagle2_5_vl.Eagle2_5_VLImageInputs", "vllm.model_executor.models.eagle2_5_vl.Eagle2_5_VLImagePixelInputs", "vllm.model_executor.models.eagle2_5_vl.Eagle2_5_VLMultiModalProcessor", "vllm.model_executor.models.eagle2_5_vl.Eagle2_5_VLProcessingInfo", "vllm.model_executor.models.eagle2_5_vl.Eagle2_5_VLProcessor" ], "n_typable": 77, "n_typed": 56, "n_any": 0, "n_untyped": 21, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 17, "n_method_overloads": 17, "n_method_params": 33, "n_classes": 7, "n_attrs": 27, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/ernie45.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.ernie45.Ernie4_5ForCausalLM", "methods": [ { "kind": "function", "name": "Ernie4_5ForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.ernie45", "names": [ "vllm.model_executor.models.ernie45.Ernie4_5ForCausalLM" ], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/ernie45_moe.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.ernie45_moe.Ernie4_5_MoeModel", "methods": [ { "kind": "function", "name": "Ernie4_5_MoeModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Ernie4_5_MoeModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Ernie4_5_MoeModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Ernie4_5_MoeModel.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Ernie4_5_MoeModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Ernie4_5_MoeModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeModel.num_redundant_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 12, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 8, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ernie45_moe.Ernie4_5_MoeDecoderLayer", "methods": [ { "kind": "function", "name": "Ernie4_5_MoeDecoderLayer.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Ernie4_5_MoeDecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Ernie4_5_MoeDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeDecoderLayer.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 10, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ernie45_moe.Ernie4_5_MoeForCausalLM", "methods": [ { "kind": "function", "name": "Ernie4_5_MoeForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Ernie4_5_MoeForCausalLM.update_physical_experts_metadata", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Ernie4_5_MoeForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Ernie4_5_MoeForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Ernie4_5_MoeForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Ernie4_5_MoeForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Ernie4_5_MoeForCausalLM.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Ernie4_5_MoeForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Ernie4_5_MoeForCausalLM.fall_back_to_pt_during_load", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Ernie4_5_MoeForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeForCausalLM.expert_weights", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeForCausalLM.num_moe_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeForCausalLM.num_expert_groups", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeForCausalLM.moe_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeForCausalLM.num_logical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeForCausalLM.num_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeForCausalLM.num_local_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeForCausalLM.num_routed_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeForCausalLM.num_shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeForCausalLM.num_redundant_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 34, "n_typed": 18, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 11, "n_attrs": 18, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ernie45_moe.Ernie4_5_MoeAttention", "methods": [ { "kind": "function", "name": "Ernie4_5_MoeAttention.__init__", "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "Ernie4_5_MoeAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Ernie4_5_MoeAttention.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeAttention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 30, "n_typed": 15, "n_any": 0, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 13, "n_attrs": 15, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ernie45_moe.Ernie4_5_MoeMoE", "methods": [ { "kind": "function", "name": "Ernie4_5_MoeMoE.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Ernie4_5_MoeMoE.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Ernie4_5_MoeMoE.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeMoE.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeMoE.moe_num_shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeMoE.ep_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeMoE.ep_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeMoE.ep_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeMoE.n_routed_experts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeMoE.n_shared_experts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeMoE.enable_eplb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeMoE.n_redundant_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeMoE.n_logical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeMoE.n_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeMoE.n_local_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeMoE.physical_expert_start", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeMoE.physical_expert_end", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeMoE.has_shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeMoE.gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeMoE.experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeMoE.shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 26, "n_typed": 8, "n_any": 0, "n_untyped": 18, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 19, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ernie45_moe.Ernie4_5_MoeMLP", "methods": [ { "kind": "function", "name": "Ernie4_5_MoeMLP.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "Ernie4_5_MoeMLP.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Ernie4_5_MoeMLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_MoeMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 8, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.ernie45_moe.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.models.ernie45_moe", "names": [ "vllm.model_executor.models.ernie45_moe.Ernie4_5_MoeAttention", "vllm.model_executor.models.ernie45_moe.Ernie4_5_MoeDecoderLayer", "vllm.model_executor.models.ernie45_moe.Ernie4_5_MoeForCausalLM", "vllm.model_executor.models.ernie45_moe.Ernie4_5_MoeMLP", "vllm.model_executor.models.ernie45_moe.Ernie4_5_MoeMoE", "vllm.model_executor.models.ernie45_moe.Ernie4_5_MoeModel", "vllm.model_executor.models.ernie45_moe.logger" ], "n_typable": 139, "n_typed": 71, "n_any": 0, "n_untyped": 68, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 20, "n_method_overloads": 20, "n_method_params": 53, "n_classes": 6, "n_attrs": 68, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/ernie45_vl.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.models.ernie45_vl.smart_resize", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "class", "name": "vllm.model_executor.models.ernie45_vl.Ernie4_5_VLDummyInputsBuilder", "methods": [ { "kind": "function", "name": "Ernie4_5_VLDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Ernie4_5_VLDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Ernie4_5_VLDummyInputsBuilder._get_dummy_videos", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 11, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.ernie45_vl.floor_by_factor", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.models.ernie45_vl.Ernie4_5_VisionTransformer", "methods": [ { "kind": "function", "name": "Ernie4_5_VisionTransformer.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Ernie4_5_VisionTransformer.rot_pos_emb", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Ernie4_5_VisionTransformer.compute_attn_mask_seqlen", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Ernie4_5_VisionTransformer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Ernie4_5_VisionTransformer.load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "Ernie4_5_VisionTransformer.dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Ernie4_5_VisionTransformer.device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "Ernie4_5_VisionTransformer.spatial_merge_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VisionTransformer.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VisionTransformer.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VisionTransformer.patch_embed", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VisionTransformer.rotary_pos_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VisionTransformer.blocks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VisionTransformer.ln", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VisionTransformer.attn_backend", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 25, "n_typed": 14, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 10, "n_attrs": 8, "n_properties": 2 }, { "kind": "function", "name": "vllm.model_executor.models.ernie45_vl.ceil_by_factor", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.models.ernie45_vl.all_gather_interleave", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.model_executor.models.ernie45_vl.Ernie4_5_VLMoeForConditionalGeneration", "methods": [ { "kind": "function", "name": "Ernie4_5_VLMoeForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Ernie4_5_VLMoeForConditionalGeneration.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Ernie4_5_VLMoeForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Ernie4_5_VLMoeForConditionalGeneration._vision_forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Ernie4_5_VLMoeForConditionalGeneration._set_visual_token_mask", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Ernie4_5_VLMoeForConditionalGeneration.get_mrope_input_positions", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Ernie4_5_VLMoeForConditionalGeneration._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Ernie4_5_VLMoeForConditionalGeneration._parse_and_validate_video_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Ernie4_5_VLMoeForConditionalGeneration._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Ernie4_5_VLMoeForConditionalGeneration._process_video_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Ernie4_5_VLMoeForConditionalGeneration._parse_and_validate_multimodal_inputs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Ernie4_5_VLMoeForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Ernie4_5_VLMoeForConditionalGeneration.embed_input_ids", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Ernie4_5_VLMoeForConditionalGeneration.forward", "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Ernie4_5_VLMoeForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Ernie4_5_VLMoeForConditionalGeneration.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Ernie4_5_VLMoeForConditionalGeneration.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeForConditionalGeneration.visual_token_mask", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeForConditionalGeneration.vision_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeForConditionalGeneration.resampler_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 49, "n_typed": 39, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 26, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ernie45_vl.Ernie4_5VLMultiModalProcessor", "methods": [ { "kind": "function", "name": "Ernie4_5VLMultiModalProcessor._pixel_values_norm", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Ernie4_5VLMultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Ernie4_5VLMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Ernie4_5VLMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 15, "n_typed": 15, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 11, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ernie45_vl.Ernie4_5_VisionRotaryEmbedding", "methods": [ { "kind": "function", "name": "Ernie4_5_VisionRotaryEmbedding.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Ernie4_5_VisionRotaryEmbedding.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Ernie4_5_VisionRotaryEmbedding.inv_freq", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 6, "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ernie45_vl.Ernie4_5_VisionBlock", "methods": [ { "kind": "function", "name": "Ernie4_5_VisionBlock.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "Ernie4_5_VisionBlock.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Ernie4_5_VisionBlock.norm1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VisionBlock.norm2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VisionBlock.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VisionBlock.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 13, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 11, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ernie45_vl.Ernie4_5_VLProcessingInfo", "methods": [ { "kind": "function", "name": "Ernie4_5_VLProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Ernie4_5_VLProcessingInfo.get_hf_processor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Ernie4_5_VLProcessingInfo.get_image_processor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Ernie4_5_VLProcessingInfo.get_data_parser", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Ernie4_5_VLProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Ernie4_5_VLProcessingInfo.get_mm_max_tokens_per_item", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Ernie4_5_VLProcessingInfo._get_vision_info", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Ernie4_5_VLProcessingInfo.get_num_image_tokens", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Ernie4_5_VLProcessingInfo.get_num_video_tokens", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Ernie4_5_VLProcessingInfo.get_image_size_with_most_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Ernie4_5_VLProcessingInfo.get_max_image_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Ernie4_5_VLProcessingInfo._get_max_video_frames", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Ernie4_5_VLProcessingInfo.get_num_frames_with_most_features", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Ernie4_5_VLProcessingInfo.get_max_video_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 38, "n_typed": 34, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 24, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.ernie45_vl.round_by_factor", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.models.ernie45_vl.Ernie4_5_VLVideoPixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Ernie4_5_VLVideoPixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLVideoPixelInputs.pixel_values_videos", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLVideoPixelInputs.video_grid_thw", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ernie45_vl.VariableResolutionResamplerModel", "methods": [ { "kind": "function", "name": "VariableResolutionResamplerModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "VariableResolutionResamplerModel.spatial_conv_reshape", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VariableResolutionResamplerModel.forward", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VariableResolutionResamplerModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "VariableResolutionResamplerModel.in_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VariableResolutionResamplerModel.out_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VariableResolutionResamplerModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VariableResolutionResamplerModel.spatial_conv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VariableResolutionResamplerModel.temporal_conv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VariableResolutionResamplerModel.use_temporal_conv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VariableResolutionResamplerModel.spatial_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VariableResolutionResamplerModel.temporal_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VariableResolutionResamplerModel.spatial_linear1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VariableResolutionResamplerModel.spatial_gelu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VariableResolutionResamplerModel.spatial_linear2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VariableResolutionResamplerModel.spatial_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VariableResolutionResamplerModel.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VariableResolutionResamplerModel.after_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VariableResolutionResamplerModel.temporal_linear1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VariableResolutionResamplerModel.temporal_gelu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VariableResolutionResamplerModel.temporal_linear2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VariableResolutionResamplerModel.temporal_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 33, "n_typed": 4, "n_any": 0, "n_untyped": 29, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 11, "n_attrs": 18, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ernie45_vl.Ernie4_5_VLImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Ernie4_5_VLImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLImagePixelInputs.pixel_values", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLImagePixelInputs.image_grid_thw", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ernie45_vl.Ernie4_5_VisionMLP", "methods": [ { "kind": "function", "name": "Ernie4_5_VisionMLP.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Ernie4_5_VisionMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Ernie4_5_VisionMLP.fc1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VisionMLP.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VisionMLP.fc2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 7, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ernie45_vl.Ernie4_5_VisionAttention", "methods": [ { "kind": "function", "name": "Ernie4_5_VisionAttention.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Ernie4_5_VisionAttention.split_qkv", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Ernie4_5_VisionAttention.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Ernie4_5_VisionAttention.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VisionAttention.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VisionAttention.hidden_size_per_attention_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VisionAttention.num_attention_heads_per_partition", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VisionAttention.qkv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VisionAttention.proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VisionAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VisionAttention.apply_rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 13, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 10, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ernie45_vl.Ernie4_5_VisionPatchEmbed", "methods": [ { "kind": "function", "name": "Ernie4_5_VisionPatchEmbed.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Ernie4_5_VisionPatchEmbed.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Ernie4_5_VisionPatchEmbed.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VisionPatchEmbed.in_channels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VisionPatchEmbed.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VisionPatchEmbed.proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 6, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 4, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.ernie45_vl.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.models.ernie45_vl", "names": [ "vllm.model_executor.models.ernie45_vl.Ernie4_5VLMultiModalProcessor", "vllm.model_executor.models.ernie45_vl.Ernie4_5_VLDummyInputsBuilder", "vllm.model_executor.models.ernie45_vl.Ernie4_5_VLImagePixelInputs", "vllm.model_executor.models.ernie45_vl.Ernie4_5_VLMoeForConditionalGeneration", "vllm.model_executor.models.ernie45_vl.Ernie4_5_VLProcessingInfo", "vllm.model_executor.models.ernie45_vl.Ernie4_5_VLVideoPixelInputs", "vllm.model_executor.models.ernie45_vl.Ernie4_5_VisionAttention", "vllm.model_executor.models.ernie45_vl.Ernie4_5_VisionBlock", "vllm.model_executor.models.ernie45_vl.Ernie4_5_VisionMLP", "vllm.model_executor.models.ernie45_vl.Ernie4_5_VisionPatchEmbed", "vllm.model_executor.models.ernie45_vl.Ernie4_5_VisionRotaryEmbedding", "vllm.model_executor.models.ernie45_vl.Ernie4_5_VisionTransformer", "vllm.model_executor.models.ernie45_vl.VariableResolutionResamplerModel", "vllm.model_executor.models.ernie45_vl.all_gather_interleave", "vllm.model_executor.models.ernie45_vl.ceil_by_factor", "vllm.model_executor.models.ernie45_vl.floor_by_factor", "vllm.model_executor.models.ernie45_vl.logger", "vllm.model_executor.models.ernie45_vl.round_by_factor", "vllm.model_executor.models.ernie45_vl.smart_resize" ], "n_typable": 264, "n_typed": 183, "n_any": 0, "n_untyped": 81, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 14, "n_methods": 56, "n_method_overloads": 56, "n_method_params": 126, "n_classes": 13, "n_attrs": 62, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/ernie45_vl_moe.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.ernie45_vl_moe.Ernie4_5_VLMoeMoE", "methods": [ { "kind": "function", "name": "Ernie4_5_VLMoeMoE.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Ernie4_5_VLMoeMoE.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Ernie4_5_VLMoeMoE.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeMoE.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeMoE.has_shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeMoE.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeMoE.e_score_correction_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeMoE.shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeMoE.text_experts_gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeMoE.text_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeMoE.vision_experts_gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeMoE.vision_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 7, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 10, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ernie45_vl_moe.Ernie4_5_VLMoeForCausalLM", "methods": [ { "kind": "function", "name": "Ernie4_5_VLMoeForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Ernie4_5_VLMoeForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Ernie4_5_VLMoeForCausalLM.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Ernie4_5_VLMoeForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Ernie4_5_VLMoeForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Ernie4_5_VLMoeForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Ernie4_5_VLMoeForCausalLM.fall_back_to_pt_during_load", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Ernie4_5_VLMoeForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 14, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 10, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ernie45_vl_moe.Ernie4_5_VLMoeModel", "methods": [ { "kind": "function", "name": "Ernie4_5_VLMoeModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Ernie4_5_VLMoeModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Ernie4_5_VLMoeModel.forward", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Ernie4_5_VLMoeModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeModel.im_patch_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 11, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ernie45_vl_moe.Ernie4_5_VLMoeDecoderLayer", "methods": [ { "kind": "function", "name": "Ernie4_5_VLMoeDecoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Ernie4_5_VLMoeDecoderLayer.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Ernie4_5_VLMoeDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeDecoderLayer.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 11, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 9, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ernie45_vl_moe.Ernie4_5_VLMoeMLP", "methods": [ { "kind": "function", "name": "Ernie4_5_VLMoeMLP.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Ernie4_5_VLMoeMLP.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Ernie4_5_VLMoeMLP.shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 6, "n_typed": 1, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.ernie45_vl_moe.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.ernie45_vl_moe.Ernie4_5_VLMoeAttention", "methods": [ { "kind": "function", "name": "Ernie4_5_VLMoeAttention.__init__", "n_typed": 13, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 }, { "kind": "function", "name": "Ernie4_5_VLMoeAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Ernie4_5_VLMoeAttention.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeAttention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie4_5_VLMoeAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 31, "n_typed": 16, "n_any": 0, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 14, "n_attrs": 15, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.ernie45_vl_moe", "names": [ "vllm.model_executor.models.ernie45_vl_moe.Ernie4_5_VLMoeAttention", "vllm.model_executor.models.ernie45_vl_moe.Ernie4_5_VLMoeDecoderLayer", "vllm.model_executor.models.ernie45_vl_moe.Ernie4_5_VLMoeForCausalLM", "vllm.model_executor.models.ernie45_vl_moe.Ernie4_5_VLMoeMLP", "vllm.model_executor.models.ernie45_vl_moe.Ernie4_5_VLMoeMoE", "vllm.model_executor.models.ernie45_vl_moe.Ernie4_5_VLMoeModel", "vllm.model_executor.models.ernie45_vl_moe.logger" ], "n_typable": 112, "n_typed": 60, "n_any": 0, "n_untyped": 52, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 16, "n_method_overloads": 16, "n_method_params": 51, "n_classes": 6, "n_attrs": 47, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/ernie_mtp.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.ernie_mtp.ErnieMultiTokenPredictorLayer", "methods": [ { "kind": "function", "name": "ErnieMultiTokenPredictorLayer.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ErnieMultiTokenPredictorLayer.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ErnieMultiTokenPredictorLayer.mtp_emb_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ErnieMultiTokenPredictorLayer.mtp_hidden_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ErnieMultiTokenPredictorLayer.mtp_linear_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ErnieMultiTokenPredictorLayer.mtp_block", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 8, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ernie_mtp.ErnieMultiTokenPredictor", "methods": [ { "kind": "function", "name": "ErnieMultiTokenPredictor.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ErnieMultiTokenPredictor.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ErnieMultiTokenPredictor.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "ErnieMultiTokenPredictor.compute_logits", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ErnieMultiTokenPredictor.mtp_start_layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ErnieMultiTokenPredictor.num_mtp_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ErnieMultiTokenPredictor.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ErnieMultiTokenPredictor.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ErnieMultiTokenPredictor.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 14, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 11, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ernie_mtp.ErnieMTP", "methods": [ { "kind": "function", "name": "ErnieMTP.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ErnieMTP.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ErnieMTP.forward", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "ErnieMTP.compute_logits", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ErnieMTP.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ErnieMTP._rewrite_spec_layer_name", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ErnieMTP.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ErnieMTP.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ErnieMTP.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 23, "n_typed": 19, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 14, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.ernie_mtp", "names": [ "vllm.model_executor.models.ernie_mtp.ErnieMTP", "vllm.model_executor.models.ernie_mtp.ErnieMultiTokenPredictor", "vllm.model_executor.models.ernie_mtp.ErnieMultiTokenPredictorLayer" ], "n_typable": 55, "n_typed": 41, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 31, "n_classes": 3, "n_attrs": 12, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/exaone.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.exaone.ExaoneModel", "methods": [ { "kind": "function", "name": "ExaoneModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ExaoneModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ExaoneModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ExaoneModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ExaoneModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneModel.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneModel.wte", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneModel.ln_f", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 11, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.exaone.ExaoneBlockAttention", "methods": [ { "kind": "function", "name": "ExaoneBlockAttention.__init__", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "ExaoneBlockAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ExaoneBlockAttention.attention", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 13, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 11, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.exaone.ExaoneGatedMLP", "methods": [ { "kind": "function", "name": "ExaoneGatedMLP.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "ExaoneGatedMLP.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ExaoneGatedMLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneGatedMLP.c_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneGatedMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.exaone.ExaoneForCausalLM", "methods": [ { "kind": "function", "name": "ExaoneForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ExaoneForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ExaoneForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ExaoneForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ExaoneForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ExaoneForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ExaoneForCausalLM.embedding_modules", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ExaoneForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneForCausalLM.transformer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 13, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.exaone.ExaoneAttention", "methods": [ { "kind": "function", "name": "ExaoneAttention.__init__", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "ExaoneAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ExaoneAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneAttention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneAttention.out_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 27, "n_typed": 13, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 11, "n_attrs": 14, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.exaone.ExaoneDecoderLayer", "methods": [ { "kind": "function", "name": "ExaoneDecoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ExaoneDecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ExaoneDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneDecoderLayer.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneDecoderLayer.ln_1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneDecoderLayer.ln_2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 9, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 5, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.exaone", "names": [ "vllm.model_executor.models.exaone.ExaoneAttention", "vllm.model_executor.models.exaone.ExaoneBlockAttention", "vllm.model_executor.models.exaone.ExaoneDecoderLayer", "vllm.model_executor.models.exaone.ExaoneForCausalLM", "vllm.model_executor.models.exaone.ExaoneGatedMLP", "vllm.model_executor.models.exaone.ExaoneModel" ], "n_typable": 105, "n_typed": 66, "n_any": 0, "n_untyped": 39, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 17, "n_method_overloads": 17, "n_method_params": 53, "n_classes": 6, "n_attrs": 37, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/exaone4.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.exaone4.Exaone4Attention", "methods": [ { "kind": "function", "name": "Exaone4Attention.__init__", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "Exaone4Attention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Exaone4Attention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Exaone4Attention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Exaone4Attention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Exaone4Attention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Exaone4Attention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Exaone4Attention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Exaone4Attention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Exaone4Attention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Exaone4Attention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Exaone4Attention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Exaone4Attention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Exaone4Attention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Exaone4Attention.q_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Exaone4Attention.k_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Exaone4Attention.sliding_window", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Exaone4Attention.apply_rope_all_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Exaone4Attention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Exaone4Attention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 31, "n_typed": 13, "n_any": 0, "n_untyped": 18, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 11, "n_attrs": 18, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.exaone4.Exaone4ForCausalLM", "methods": [ { "kind": "function", "name": "Exaone4ForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Exaone4ForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Exaone4ForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Exaone4ForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Exaone4ForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Exaone4ForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Exaone4ForCausalLM.embedding_modules", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Exaone4ForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Exaone4ForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Exaone4ForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Exaone4ForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Exaone4ForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Exaone4ForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 13, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.exaone4.Exaone4GatedMLP", "methods": [ { "kind": "function", "name": "Exaone4GatedMLP.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "Exaone4GatedMLP.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Exaone4GatedMLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Exaone4GatedMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Exaone4GatedMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 8, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.exaone4.Exaone4Model", "methods": [ { "kind": "function", "name": "Exaone4Model.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Exaone4Model.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Exaone4Model.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Exaone4Model.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Exaone4Model.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Exaone4Model.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Exaone4Model.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Exaone4Model.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Exaone4Model.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Exaone4Model.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 11, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.exaone4.Exaone4DecoderLayer", "methods": [ { "kind": "function", "name": "Exaone4DecoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Exaone4DecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Exaone4DecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Exaone4DecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Exaone4DecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Exaone4DecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Exaone4DecoderLayer.post_feedforward_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 9, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 5, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.exaone4", "names": [ "vllm.model_executor.models.exaone4.Exaone4Attention", "vllm.model_executor.models.exaone4.Exaone4DecoderLayer", "vllm.model_executor.models.exaone4.Exaone4ForCausalLM", "vllm.model_executor.models.exaone4.Exaone4GatedMLP", "vllm.model_executor.models.exaone4.Exaone4Model" ], "n_typable": 96, "n_typed": 54, "n_any": 0, "n_untyped": 42, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 43, "n_classes": 5, "n_attrs": 40, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/exaone_moe.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.exaone_moe.ExaoneMoe", "methods": [ { "kind": "function", "name": "ExaoneMoe.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ExaoneMoe.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ExaoneMoe.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoe.routed_scaling_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoe.ep_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoe.ep_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoe.ep_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoe.n_routed_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoe.gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoe.e_score_correction_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoe.enable_eplb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoe.n_logical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoe.n_redundant_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoe.n_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoe.n_local_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoe.physical_expert_start", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoe.physical_expert_end", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoe.experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoe.shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 24, "n_typed": 6, "n_any": 0, "n_untyped": 18, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 17, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.exaone_moe.ExaoneMoeModel", "methods": [ { "kind": "function", "name": "ExaoneMoeModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ExaoneMoeModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ExaoneMoeModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ExaoneMoeModel.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ExaoneMoeModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ExaoneMoeModel.num_redundant_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoeModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoeModel.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoeModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoeModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoeModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoeModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 12, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 8, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.exaone_moe.ExaoneMoeForCausalLM", "methods": [ { "kind": "function", "name": "ExaoneMoeForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ExaoneMoeForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ExaoneMoeForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ExaoneMoeForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ExaoneMoeForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ExaoneMoeForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ExaoneMoeForCausalLM.embedding_modules", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ExaoneMoeForCausalLM.embedding_padding_modules", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ExaoneMoeForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoeForCausalLM.lora_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoeForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoeForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoeForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoeForCausalLM.unpadded_vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoeForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoeForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 13, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 11, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.exaone_moe.ExaoneMoeDecoderLayer", "methods": [ { "kind": "function", "name": "ExaoneMoeDecoderLayer.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "ExaoneMoeDecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ExaoneMoeDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoeDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoeDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoeDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoeDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 10, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 5, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.exaone_moe", "names": [ "vllm.model_executor.models.exaone_moe.ExaoneMoe", "vllm.model_executor.models.exaone_moe.ExaoneMoeDecoderLayer", "vllm.model_executor.models.exaone_moe.ExaoneMoeForCausalLM", "vllm.model_executor.models.exaone_moe.ExaoneMoeModel" ], "n_typable": 81, "n_typed": 41, "n_any": 0, "n_untyped": 40, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 30, "n_classes": 4, "n_attrs": 40, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/exaone_moe_mtp.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.models.exaone_moe_mtp.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.exaone_moe_mtp.ExaoneMoeMultiTokenPredictor", "methods": [ { "kind": "function", "name": "ExaoneMoeMultiTokenPredictor.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ExaoneMoeMultiTokenPredictor.get_input_embeddings", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ExaoneMoeMultiTokenPredictor.forward", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "ExaoneMoeMultiTokenPredictor.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ExaoneMoeMultiTokenPredictor.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoeMultiTokenPredictor.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoeMultiTokenPredictor.org_vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoeMultiTokenPredictor.mtp_start_layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoeMultiTokenPredictor.num_mtp_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoeMultiTokenPredictor.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoeMultiTokenPredictor.fc", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoeMultiTokenPredictor.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoeMultiTokenPredictor.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoeMultiTokenPredictor.pre_fc_norm_hidden", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoeMultiTokenPredictor.pre_fc_norm_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 25, "n_typed": 13, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 10, "n_attrs": 11, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.exaone_moe_mtp.ExaoneMoeMTP", "methods": [ { "kind": "function", "name": "ExaoneMoeMTP.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ExaoneMoeMTP.get_input_embeddings", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ExaoneMoeMTP.forward", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "ExaoneMoeMTP.compute_logits", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ExaoneMoeMTP.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ExaoneMoeMTP.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoeMTP.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoeMTP.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoeMTP.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoeMTP.unpadded_vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoeMTP.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExaoneMoeMTP.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 25, "n_typed": 16, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 13, "n_attrs": 7, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.exaone_moe_mtp.KVCache", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.exaone_moe_mtp", "names": [ "vllm.model_executor.models.exaone_moe_mtp.ExaoneMoeMTP", "vllm.model_executor.models.exaone_moe_mtp.ExaoneMoeMultiTokenPredictor", "vllm.model_executor.models.exaone_moe_mtp.KVCache", "vllm.model_executor.models.exaone_moe_mtp.logger" ], "n_typable": 51, "n_typed": 29, "n_any": 0, "n_untyped": 22, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 23, "n_classes": 2, "n_attrs": 20, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/extract_hidden_states.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.extract_hidden_states.CacheOnlyAttentionLayer", "methods": [ { "kind": "function", "name": "CacheOnlyAttentionLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "CacheOnlyAttentionLayer.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CacheOnlyAttentionLayer.get_attn_backend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CacheOnlyAttentionLayer.get_kv_cache_spec", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CacheOnlyAttentionLayer.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CacheOnlyAttentionLayer.head_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CacheOnlyAttentionLayer.layer_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CacheOnlyAttentionLayer.kv_cache_torch_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CacheOnlyAttentionLayer.attn_backend", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CacheOnlyAttentionLayer.impl", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CacheOnlyAttentionLayer.kv_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CacheOnlyAttentionLayer.block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 10, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 7, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.extract_hidden_states.CacheOnlyAttentionBackend", "methods": [ { "kind": "function", "name": "CacheOnlyAttentionBackend.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CacheOnlyAttentionBackend.supports_attn_type", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CacheOnlyAttentionBackend.supports_mm_prefix", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CacheOnlyAttentionBackend.get_impl_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CacheOnlyAttentionBackend.get_kv_cache_shape", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "CacheOnlyAttentionBackend.get_builder_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CacheOnlyAttentionBackend.use_cascade_attention", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CacheOnlyAttentionBackend.get_supported_head_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CacheOnlyAttentionBackend.accept_output_buffer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CacheOnlyAttentionBackend.supported_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CacheOnlyAttentionBackend.supported_kv_cache_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CacheOnlyAttentionBackend.forward_includes_kv_cache_update", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 20, "n_typed": 18, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 8, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.extract_hidden_states.ExtractHiddenStatesModel", "methods": [ { "kind": "function", "name": "ExtractHiddenStatesModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ExtractHiddenStatesModel.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ExtractHiddenStatesModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ExtractHiddenStatesModel.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExtractHiddenStatesModel.hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExtractHiddenStatesModel.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExtractHiddenStatesModel.target_num_hidden_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExtractHiddenStatesModel.num_hidden_states", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExtractHiddenStatesModel.cache_only_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 6, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_attrs": 6, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.extract_hidden_states.unified_kv_cache_update", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.models.extract_hidden_states.CacheOnlyAttentionImpl", "methods": [ { "kind": "function", "name": "CacheOnlyAttentionImpl.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "CacheOnlyAttentionImpl.do_kv_cache_update", "n_typed": 0, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "CacheOnlyAttentionImpl.forward", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CacheOnlyAttentionImpl.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CacheOnlyAttentionImpl.head_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CacheOnlyAttentionImpl.kv_cache_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CacheOnlyAttentionImpl.kv_cache_torch_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CacheOnlyAttentionImpl.num_queries_per_kv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 6, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 11, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.extract_hidden_states.CacheOnlyAttentionMetadata", "methods": [ { "kind": "function", "name": "CacheOnlyAttentionMetadata.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CacheOnlyAttentionMetadata.slot_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 3, "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.extract_hidden_states.CacheOnlyAttentionMetadataBuilder", "methods": [ { "kind": "function", "name": "CacheOnlyAttentionMetadataBuilder.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "CacheOnlyAttentionMetadataBuilder.build", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.extract_hidden_states.basic_cache", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.models.extract_hidden_states.dummy_attention", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.model_executor.models.extract_hidden_states", "names": [ "vllm.model_executor.models.extract_hidden_states.CacheOnlyAttentionBackend", "vllm.model_executor.models.extract_hidden_states.CacheOnlyAttentionImpl", "vllm.model_executor.models.extract_hidden_states.CacheOnlyAttentionLayer", "vllm.model_executor.models.extract_hidden_states.CacheOnlyAttentionMetadata", "vllm.model_executor.models.extract_hidden_states.CacheOnlyAttentionMetadataBuilder", "vllm.model_executor.models.extract_hidden_states.ExtractHiddenStatesModel", "vllm.model_executor.models.extract_hidden_states.basic_cache", "vllm.model_executor.models.extract_hidden_states.dummy_attention", "vllm.model_executor.models.extract_hidden_states.unified_kv_cache_update" ], "n_typable": 93, "n_typed": 55, "n_any": 0, "n_untyped": 38, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 7, "n_methods": 21, "n_method_overloads": 21, "n_method_params": 38, "n_classes": 6, "n_attrs": 24, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/fairseq2_llama.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.fairseq2_llama.Fairseq2LlamaForCausalLM", "methods": [ { "kind": "function", "name": "Fairseq2LlamaForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Fairseq2LlamaForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Fairseq2LlamaForCausalLM.flag_sharded_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Fairseq2LlamaForCausalLM.reshape_fairseq2_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Fairseq2LlamaForCausalLM.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Fairseq2LlamaForCausalLM.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Fairseq2LlamaForCausalLM.allow_patterns_overrides", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 9, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 7, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.fairseq2_llama", "names": [ "vllm.model_executor.models.fairseq2_llama.Fairseq2LlamaForCausalLM" ], "n_typable": 14, "n_typed": 9, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 7, "n_classes": 1, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/falcon.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.falcon.FalconModel", "methods": [ { "kind": "function", "name": "FalconModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FalconModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FalconModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FalconModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FalconModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconModel.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconModel.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconModel.use_alibi", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconModel.word_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconModel.ln_f", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 11, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 7, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.falcon.FalconConfig", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.falcon.FalconMLP", "methods": [ { "kind": "function", "name": "FalconMLP.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "FalconMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FalconMLP.dense_h_to_4h", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconMLP.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconMLP.reduce_row_parallel_results", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconMLP.dense_4h_to_h", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 5, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.falcon.FalconAttention", "methods": [ { "kind": "function", "name": "FalconAttention.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FalconAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FalconAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconAttention.new_decoder_architecture", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconAttention.multi_query", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconAttention.query_key_value", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconAttention.inv_norm_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconAttention.reduce_row_parallel_results", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconAttention.dense", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconAttention.use_rotary", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconAttention.use_alibi", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 26, "n_typed": 7, "n_any": 0, "n_untyped": 19, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 18, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.falcon.FalconForCausalLM", "methods": [ { "kind": "function", "name": "FalconForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FalconForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FalconForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FalconForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FalconForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FalconForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FalconForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconForCausalLM.transformer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconForCausalLM.tie_word_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 13, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.falcon.FalconDecoderLayer", "methods": [ { "kind": "function", "name": "FalconDecoderLayer.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FalconDecoderLayer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FalconDecoderLayer.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconDecoderLayer.self_attention", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconDecoderLayer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconDecoderLayer.reduce_row_parallel_results", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconDecoderLayer.ln_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconDecoderLayer.ln_mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 7, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 9, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.falcon", "names": [ "vllm.model_executor.models.falcon.FalconAttention", "vllm.model_executor.models.falcon.FalconConfig", "vllm.model_executor.models.falcon.FalconDecoderLayer", "vllm.model_executor.models.falcon.FalconForCausalLM", "vllm.model_executor.models.falcon.FalconMLP", "vllm.model_executor.models.falcon.FalconModel" ], "n_typable": 94, "n_typed": 44, "n_any": 0, "n_untyped": 50, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 33, "n_classes": 5, "n_attrs": 47, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/falcon_h1.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.falcon_h1.FalconH1MLP", "methods": [ { "kind": "function", "name": "FalconH1MLP.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FalconH1MLP.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FalconH1MLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1MLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1MLP.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1MLP.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1MLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 5, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.falcon_h1.FalconH1ForCausalLM", "methods": [ { "kind": "function", "name": "FalconH1ForCausalLM.get_mamba_state_dtype_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FalconH1ForCausalLM.get_mamba_state_shape_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FalconH1ForCausalLM.get_mamba_state_copy_func", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FalconH1ForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FalconH1ForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FalconH1ForCausalLM.forward", "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "FalconH1ForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FalconH1ForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FalconH1ForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FalconH1ForCausalLM.embedding_modules", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FalconH1ForCausalLM.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1ForCausalLM.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1ForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1ForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1ForCausalLM.scheduler_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1ForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1ForCausalLM.tie_word_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1ForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1ForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1ForCausalLM.lm_head_multiplier", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1ForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 31, "n_typed": 17, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 12, "n_attrs": 13, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.falcon_h1.FalconH1AttentionDecoderLayer", "methods": [ { "kind": "function", "name": "FalconH1AttentionDecoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FalconH1AttentionDecoderLayer.self_attention", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "FalconH1AttentionDecoderLayer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FalconH1AttentionDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1AttentionDecoderLayer.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1AttentionDecoderLayer.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1AttentionDecoderLayer.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1AttentionDecoderLayer.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1AttentionDecoderLayer.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1AttentionDecoderLayer.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1AttentionDecoderLayer.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1AttentionDecoderLayer.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1AttentionDecoderLayer.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1AttentionDecoderLayer.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1AttentionDecoderLayer.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1AttentionDecoderLayer.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1AttentionDecoderLayer.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1AttentionDecoderLayer.key_multiplier", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 29, "n_typed": 11, "n_any": 0, "n_untyped": 18, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 11, "n_attrs": 15, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.falcon_h1.FalconH1ParallelHybrid", "methods": [ { "kind": "function", "name": "FalconH1ParallelHybrid.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "FalconH1ParallelHybrid.forward", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FalconH1ParallelHybrid.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1ParallelHybrid.mamba", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1ParallelHybrid.ssm_out_multiplier", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1ParallelHybrid.ssm_in_multiplier", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1ParallelHybrid.attention_in_multiplier", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1ParallelHybrid.attn_out_multiplier", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1ParallelHybrid.feed_forward", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1ParallelHybrid.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1ParallelHybrid.pre_ff_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 9, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 9, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.falcon_h1.FalconH1SSMDecoderLayer", "methods": [ { "kind": "function", "name": "FalconH1SSMDecoderLayer.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "FalconH1SSMDecoderLayer._init_mup_vector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FalconH1SSMDecoderLayer.forward", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FalconH1SSMDecoderLayer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1SSMDecoderLayer.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1SSMDecoderLayer.d_ssm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1SSMDecoderLayer.mamba", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1SSMDecoderLayer.groups_time_state_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1SSMDecoderLayer.zxbcdt_multipliers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 8, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 8, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.falcon_h1.FalconH1Model", "methods": [ { "kind": "function", "name": "FalconH1Model.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FalconH1Model.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FalconH1Model.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FalconH1Model.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1Model.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1Model.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1Model.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1Model.embedding_multiplier", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FalconH1Model.final_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 9, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.falcon_h1", "names": [ "vllm.model_executor.models.falcon_h1.FalconH1AttentionDecoderLayer", "vllm.model_executor.models.falcon_h1.FalconH1ForCausalLM", "vllm.model_executor.models.falcon_h1.FalconH1MLP", "vllm.model_executor.models.falcon_h1.FalconH1Model", "vllm.model_executor.models.falcon_h1.FalconH1ParallelHybrid", "vllm.model_executor.models.falcon_h1.FalconH1SSMDecoderLayer" ], "n_typable": 125, "n_typed": 59, "n_any": 0, "n_untyped": 66, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 21, "n_method_overloads": 21, "n_method_params": 52, "n_classes": 6, "n_attrs": 54, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/fireredasr2.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.fireredasr2.FireRedASR2MultiModalProcessor", "methods": [ { "kind": "function", "name": "FireRedASR2MultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FireRedASR2MultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FireRedASR2MultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.fireredasr2.ConformerEncoder", "methods": [ { "kind": "function", "name": "ConformerEncoder.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "ConformerEncoder.forward", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ConformerEncoder.padding_position_is_0", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ConformerEncoder.odim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConformerEncoder.input_preprocessor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConformerEncoder.positional_encoding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConformerEncoder.layer_stack", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 12, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 11, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.fireredasr2.FireRedASR2ProcessingInfo", "methods": [ { "kind": "function", "name": "FireRedASR2ProcessingInfo.get_hf_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FireRedASR2ProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FireRedASR2ProcessingInfo.get_feature_extractor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FireRedASR2ProcessingInfo.get_data_parser", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FireRedASR2ProcessingInfo.get_target_channels", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.fireredasr2.Swish", "methods": [ { "kind": "function", "name": "Swish.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.fireredasr2.EncoderMultiHeadAttention", "methods": [ { "kind": "function", "name": "EncoderMultiHeadAttention.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EncoderMultiHeadAttention.forward_qkv", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "EncoderMultiHeadAttention.forward_output", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "EncoderMultiHeadAttention.forward_attention", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EncoderMultiHeadAttention.n_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EncoderMultiHeadAttention.d_k", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EncoderMultiHeadAttention.d_v", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EncoderMultiHeadAttention.w_qs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EncoderMultiHeadAttention.w_ks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EncoderMultiHeadAttention.w_vs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EncoderMultiHeadAttention.layer_norm_q", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EncoderMultiHeadAttention.layer_norm_k", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EncoderMultiHeadAttention.layer_norm_v", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EncoderMultiHeadAttention.fc", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 26, "n_typed": 15, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 12, "n_attrs": 10, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.fireredasr2.ConformerConvolution", "methods": [ { "kind": "function", "name": "ConformerConvolution.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ConformerConvolution.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ConformerConvolution.pre_layer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConformerConvolution.pointwise_conv1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConformerConvolution.padding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConformerConvolution.depthwise_conv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConformerConvolution.batch_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConformerConvolution.swish", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConformerConvolution.pointwise_conv2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 5, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.fireredasr2.FireRedASR2Encoder", "methods": [ { "kind": "function", "name": "FireRedASR2Encoder.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FireRedASR2Encoder.audio_encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 3, "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.fireredasr2.FireRedASR2Model", "methods": [ { "kind": "function", "name": "FireRedASR2Model.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FireRedASR2Model.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "FireRedASR2Model.get_encoder_outputs", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FireRedASR2Model.encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FireRedASR2Model.encoder_projector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FireRedASR2Model.decoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 9, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.fireredasr2.RelPosMultiHeadAttention", "methods": [ { "kind": "function", "name": "RelPosMultiHeadAttention.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "RelPosMultiHeadAttention._rel_shift", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RelPosMultiHeadAttention.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RelPosMultiHeadAttention.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RelPosMultiHeadAttention.linear_pos", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RelPosMultiHeadAttention.pos_bias_u", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RelPosMultiHeadAttention.pos_bias_v", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 8, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 8, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.fireredasr2.FireRedASR2Adapter", "methods": [ { "kind": "function", "name": "FireRedASR2Adapter.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "FireRedASR2Adapter.forward", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FireRedASR2Adapter.ds", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FireRedASR2Adapter.linear1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FireRedASR2Adapter.relu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FireRedASR2Adapter.linear2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 3, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.fireredasr2.FireRedASR2DummyInputsBuilder", "methods": [ { "kind": "function", "name": "FireRedASR2DummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FireRedASR2DummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.fireredasr2.FireRedASR2ForConditionalGeneration", "methods": [ { "kind": "function", "name": "FireRedASR2ForConditionalGeneration.validate_language", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FireRedASR2ForConditionalGeneration.get_generation_prompt", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "FireRedASR2ForConditionalGeneration.get_speech_to_text_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FireRedASR2ForConditionalGeneration.get_num_audio_tokens", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "FireRedASR2ForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FireRedASR2ForConditionalGeneration.forward", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FireRedASR2ForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FireRedASR2ForConditionalGeneration.embed_input_ids", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FireRedASR2ForConditionalGeneration._parse_and_validate_audio_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FireRedASR2ForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FireRedASR2ForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FireRedASR2ForConditionalGeneration.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FireRedASR2ForConditionalGeneration.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FireRedASR2ForConditionalGeneration.supports_transcription_only", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FireRedASR2ForConditionalGeneration.supports_segment_timestamp", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FireRedASR2ForConditionalGeneration.supported_languages", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FireRedASR2ForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FireRedASR2ForConditionalGeneration.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FireRedASR2ForConditionalGeneration.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FireRedASR2ForConditionalGeneration.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 43, "n_typed": 36, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 27, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.fireredasr2.FireRedASR2AudioInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "FireRedASR2AudioInputs.input_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FireRedASR2AudioInputs.speech_lengths", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FireRedASR2AudioInputs.fake_token_lengths", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.fireredasr2.Conv2dSubsampling", "methods": [ { "kind": "function", "name": "Conv2dSubsampling.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Conv2dSubsampling.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Conv2dSubsampling.conv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Conv2dSubsampling.out", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Conv2dSubsampling.subsampling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Conv2dSubsampling.context", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 6, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.fireredasr2.RelPositionalEncoding", "methods": [ { "kind": "function", "name": "RelPositionalEncoding.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "RelPositionalEncoding.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RelPositionalEncoding.pe", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 6, "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.fireredasr2.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.fireredasr2.ConformerFeedForward", "methods": [ { "kind": "function", "name": "ConformerFeedForward.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ConformerFeedForward.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ConformerFeedForward.pre_layer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConformerFeedForward.linear_expand", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConformerFeedForward.nonlinear", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConformerFeedForward.linear_project", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 3, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.fireredasr2.RelPosEmbConformerBlock", "methods": [ { "kind": "function", "name": "RelPosEmbConformerBlock.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "RelPosEmbConformerBlock.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RelPosEmbConformerBlock.ffn1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RelPosEmbConformerBlock.mhsa", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RelPosEmbConformerBlock.conv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RelPosEmbConformerBlock.ffn2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RelPosEmbConformerBlock.layer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 5, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 5, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.fireredasr2", "names": [ "vllm.model_executor.models.fireredasr2.ConformerConvolution", "vllm.model_executor.models.fireredasr2.ConformerEncoder", "vllm.model_executor.models.fireredasr2.ConformerFeedForward", "vllm.model_executor.models.fireredasr2.Conv2dSubsampling", "vllm.model_executor.models.fireredasr2.EncoderMultiHeadAttention", "vllm.model_executor.models.fireredasr2.FireRedASR2Adapter", "vllm.model_executor.models.fireredasr2.FireRedASR2AudioInputs", "vllm.model_executor.models.fireredasr2.FireRedASR2DummyInputsBuilder", "vllm.model_executor.models.fireredasr2.FireRedASR2Encoder", "vllm.model_executor.models.fireredasr2.FireRedASR2ForConditionalGeneration", "vllm.model_executor.models.fireredasr2.FireRedASR2Model", "vllm.model_executor.models.fireredasr2.FireRedASR2MultiModalProcessor", "vllm.model_executor.models.fireredasr2.FireRedASR2ProcessingInfo", "vllm.model_executor.models.fireredasr2.RelPosEmbConformerBlock", "vllm.model_executor.models.fireredasr2.RelPosMultiHeadAttention", "vllm.model_executor.models.fireredasr2.RelPositionalEncoding", "vllm.model_executor.models.fireredasr2.Swish", "vllm.model_executor.models.fireredasr2.logger" ], "n_typable": 211, "n_typed": 136, "n_any": 0, "n_untyped": 75, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 48, "n_method_overloads": 48, "n_method_params": 107, "n_classes": 17, "n_attrs": 60, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/flex_olmo.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.flex_olmo.FlexOlmoDecoderLayer", "methods": [ { "kind": "function", "name": "FlexOlmoDecoderLayer.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FlexOlmoDecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlexOlmoDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlexOlmoDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlexOlmoDecoderLayer.post_feedforward_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlexOlmoDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 7, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.flex_olmo.FlexOlmoMoE", "methods": [ { "kind": "function", "name": "FlexOlmoMoE.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FlexOlmoMoE.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlexOlmoMoE.gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlexOlmoMoE.experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlexOlmoMoE.top_k", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 4, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.flex_olmo.FlexOlmoForCausalLM", "methods": [ { "kind": "function", "name": "FlexOlmoForCausalLM.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlexOlmoForCausalLM.fall_back_to_pt_during_load", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 4, "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 3, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.flex_olmo.FlexOlmoAttention", "methods": [ { "kind": "function", "name": "FlexOlmoAttention.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlexOlmoAttention.k_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlexOlmoAttention.q_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 5, "n_typed": 2, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.flex_olmo.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.models.flex_olmo", "names": [ "vllm.model_executor.models.flex_olmo.FlexOlmoAttention", "vllm.model_executor.models.flex_olmo.FlexOlmoDecoderLayer", "vllm.model_executor.models.flex_olmo.FlexOlmoForCausalLM", "vllm.model_executor.models.flex_olmo.FlexOlmoMoE", "vllm.model_executor.models.flex_olmo.logger" ], "n_typable": 29, "n_typed": 16, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 13, "n_classes": 4, "n_attrs": 11, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/funasr.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.funasr.MultiHeadedAttentionSANM", "methods": [ { "kind": "function", "name": "MultiHeadedAttentionSANM.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MultiHeadedAttentionSANM.forward_fsmn", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MultiHeadedAttentionSANM.forward_qkv", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiHeadedAttentionSANM.forward_attention", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MultiHeadedAttentionSANM.forward", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MultiHeadedAttentionSANM.d_k", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadedAttentionSANM.h", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadedAttentionSANM.out_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadedAttentionSANM.linear_q_k_v", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadedAttentionSANM.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadedAttentionSANM.fsmn_block", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadedAttentionSANM.pad_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 29, "n_typed": 17, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 17, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.funasr.FunASRForConditionalGeneration", "methods": [ { "kind": "function", "name": "FunASRForConditionalGeneration.validate_language", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FunASRForConditionalGeneration.get_generation_prompt", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "FunASRForConditionalGeneration.get_speech_to_text_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FunASRForConditionalGeneration.get_num_audio_tokens", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "FunASRForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FunASRForConditionalGeneration.forward", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FunASRForConditionalGeneration.get_language_model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FunASRForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FunASRForConditionalGeneration.embed_input_ids", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FunASRForConditionalGeneration._parse_and_validate_audio_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FunASRForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FunASRForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FunASRForConditionalGeneration.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FunASRForConditionalGeneration.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunASRForConditionalGeneration.supports_transcription_only", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FunASRForConditionalGeneration.supports_segment_timestamp", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FunASRForConditionalGeneration.supported_languages", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FunASRForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunASRForConditionalGeneration.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunASRForConditionalGeneration.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunASRForConditionalGeneration.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunASRForConditionalGeneration.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 45, "n_typed": 37, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 27, "n_attrs": 10, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.funasr.LayerNorm", "methods": [ { "kind": "function", "name": "LayerNorm.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LayerNorm.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LayerNorm.dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 6, "n_typed": 1, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.funasr.FunASREncoder", "methods": [ { "kind": "function", "name": "FunASREncoder.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "FunASREncoder.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FunASREncoder.audio_encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunASREncoder.audio_adaptor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 5, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.funasr.FunASRDummyInputsBuilder", "methods": [ { "kind": "function", "name": "FunASRDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FunASRDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.funasr.SinusoidalPositionEncoder", "methods": [ { "kind": "function", "name": "SinusoidalPositionEncoder.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SinusoidalPositionEncoder.encode", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SinusoidalPositionEncoder.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 8, "n_typed": 4, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.funasr.EncoderLayer", "methods": [ { "kind": "function", "name": "EncoderLayer.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "EncoderLayer.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EncoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EncoderLayer.feed_forward", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EncoderLayer.norm1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EncoderLayer.norm2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 4, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.funasr.FunASRAudioAttention", "methods": [ { "kind": "function", "name": "FunASRAudioAttention.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "FunASRAudioAttention.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FunASRAudioAttention.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunASRAudioAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunASRAudioAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunASRAudioAttention.num_local_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunASRAudioAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunASRAudioAttention.qkv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunASRAudioAttention.out_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunASRAudioAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 7, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.funasr.SenseVoiceEncoderSmall", "methods": [ { "kind": "function", "name": "SenseVoiceEncoderSmall.__init__", "n_typed": 10, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "SenseVoiceEncoderSmall.output_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SenseVoiceEncoderSmall.forward", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SenseVoiceEncoderSmall.embed", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SenseVoiceEncoderSmall.normalize_before", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SenseVoiceEncoderSmall.encoders0", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SenseVoiceEncoderSmall.encoders", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SenseVoiceEncoderSmall.tp_encoders", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SenseVoiceEncoderSmall.after_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SenseVoiceEncoderSmall.tp_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 23, "n_typed": 13, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 13, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.funasr.Transformer", "methods": [ { "kind": "function", "name": "Transformer.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Transformer.forward", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Transformer.k", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Transformer.encoder_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Transformer.llm_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Transformer.linear1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Transformer.relu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Transformer.linear2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Transformer.blocks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 4, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 7, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.funasr.sequence_mask", "n_typed": 0, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.model_executor.models.funasr.FunASRAudioInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "FunASRAudioInputs.input_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FunASRAudioInputs.speech_lengths", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.funasr.FunASRProcessingInfo", "methods": [ { "kind": "function", "name": "FunASRProcessingInfo.get_hf_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FunASRProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FunASRProcessingInfo.get_feature_extractor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FunASRProcessingInfo.get_data_parser", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FunASRProcessingInfo.get_target_channels", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FunASRProcessingInfo.get_num_audio_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.funasr.FunASRMultiModalProcessor", "methods": [ { "kind": "function", "name": "FunASRMultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FunASRMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FunASRMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.funasr.EncoderLayerSANM", "methods": [ { "kind": "function", "name": "EncoderLayerSANM.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "EncoderLayerSANM.forward", "n_typed": 2, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EncoderLayerSANM.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EncoderLayerSANM.feed_forward", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EncoderLayerSANM.norm1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EncoderLayerSANM.norm2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EncoderLayerSANM.in_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EncoderLayerSANM.size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EncoderLayerSANM.normalize_before", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 6, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 10, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.funasr.PositionwiseFeedForward", "methods": [ { "kind": "function", "name": "PositionwiseFeedForward.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PositionwiseFeedForward.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PositionwiseFeedForward.w_1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PositionwiseFeedForward.w_2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PositionwiseFeedForward.activation", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 3, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.funasr.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.funasr.FunASRModel", "methods": [ { "kind": "function", "name": "FunASRModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FunASRModel.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "FunASRModel.get_encoder_outputs", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FunASRModel.encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunASRModel.decoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 9, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.funasr", "names": [ "vllm.model_executor.models.funasr.EncoderLayer", "vllm.model_executor.models.funasr.EncoderLayerSANM", "vllm.model_executor.models.funasr.FunASRAudioAttention", "vllm.model_executor.models.funasr.FunASRAudioInputs", "vllm.model_executor.models.funasr.FunASRDummyInputsBuilder", "vllm.model_executor.models.funasr.FunASREncoder", "vllm.model_executor.models.funasr.FunASRForConditionalGeneration", "vllm.model_executor.models.funasr.FunASRModel", "vllm.model_executor.models.funasr.FunASRMultiModalProcessor", "vllm.model_executor.models.funasr.FunASRProcessingInfo", "vllm.model_executor.models.funasr.LayerNorm", "vllm.model_executor.models.funasr.MultiHeadedAttentionSANM", "vllm.model_executor.models.funasr.PositionwiseFeedForward", "vllm.model_executor.models.funasr.SenseVoiceEncoderSmall", "vllm.model_executor.models.funasr.SinusoidalPositionEncoder", "vllm.model_executor.models.funasr.Transformer", "vllm.model_executor.models.funasr.logger", "vllm.model_executor.models.funasr.sequence_mask" ], "n_typable": 234, "n_typed": 137, "n_any": 0, "n_untyped": 97, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 4, "n_methods": 51, "n_method_overloads": 51, "n_method_params": 121, "n_classes": 16, "n_attrs": 61, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/funaudiochat.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.funaudiochat.FunAudioChatDummyInputsBuilder", "methods": [ { "kind": "function", "name": "FunAudioChatDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FunAudioChatDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.funaudiochat.FunAudioChatProcessingInfo", "methods": [ { "kind": "function", "name": "FunAudioChatProcessingInfo.get_feature_extractor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FunAudioChatProcessingInfo.get_speech_tokenizer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FunAudioChatProcessingInfo.get_data_parser", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FunAudioChatProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FunAudioChatProcessingInfo.get_target_channels", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FunAudioChatProcessingInfo.get_mm_max_tokens_per_item", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FunAudioChatProcessingInfo.get_audio_group_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "FunAudioChatProcessingInfo.feature_extractor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "FunAudioChatProcessingInfo.speech_tokenizer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "FunAudioChatProcessingInfo.token_fps", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 12, "n_typed": 11, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 2, "n_attrs": 1, "n_properties": 2 }, { "kind": "class", "name": "vllm.model_executor.models.funaudiochat.FunAudioChatDiscreteEncoder", "methods": [ { "kind": "function", "name": "FunAudioChatDiscreteEncoder.__init__", "n_typed": 0, "n_any": 1, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FunAudioChatDiscreteEncoder.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FunAudioChatDiscreteEncoder._get_feat_extract_output_lengths", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FunAudioChatDiscreteEncoder.padding_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatDiscreteEncoder.group_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatDiscreteEncoder.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatDiscreteEncoder.continuous_features_mode", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatDiscreteEncoder.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatDiscreteEncoder.output_matching", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatDiscreteEncoder.continual_output_matching", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 7, "n_any": 1, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.funaudiochat.FunAudioChatAudioEncoder", "methods": [ { "kind": "function", "name": "FunAudioChatAudioEncoder.__init__", "n_typed": 0, "n_any": 1, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FunAudioChatAudioEncoder._prepare_attention_mask", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FunAudioChatAudioEncoder.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "FunAudioChatAudioEncoder.padded_and_mask_function", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FunAudioChatAudioEncoder._get_feat_extract_output_lengths", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "FunAudioChatAudioEncoder.dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "FunAudioChatAudioEncoder.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoder.num_mel_bins", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoder.max_source_positions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoder.embed_scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoder.n_window", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoder.conv1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoder.conv2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoder.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoder.ln_post", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoder.avg_pooler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoder.proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoder.positional_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoder.audio_bos_eos_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 32, "n_typed": 17, "n_any": 1, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 13, "n_attrs": 13, "n_properties": 1 }, { "kind": "class", "name": "vllm.model_executor.models.funaudiochat.FunAudioChatForConditionalGeneration", "methods": [ { "kind": "function", "name": "FunAudioChatForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FunAudioChatForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FunAudioChatForConditionalGeneration._get_continuous_audio_features", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "FunAudioChatForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FunAudioChatForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "FunAudioChatForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FunAudioChatForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FunAudioChatForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatForConditionalGeneration.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatForConditionalGeneration.continuous_audio_tower", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatForConditionalGeneration.audio_tower", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 29, "n_typed": 21, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 15, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.funaudiochat.FunAudioChatAudioAttention", "methods": [ { "kind": "function", "name": "FunAudioChatAudioAttention.__init__", "n_typed": 0, "n_any": 1, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FunAudioChatAudioAttention.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FunAudioChatAudioAttention.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FunAudioChatAudioAttention.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioAttention.dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioAttention.num_key_value_groups", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioAttention.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioAttention.attention_dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioAttention.is_decoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioAttention.is_causal", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioAttention.out_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 26, "n_typed": 7, "n_any": 1, "n_untyped": 18, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_attrs": 17, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.funaudiochat.FunAudioChatAudioEncoderLayer", "methods": [ { "kind": "function", "name": "FunAudioChatAudioEncoderLayer.__init__", "n_typed": 0, "n_any": 1, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FunAudioChatAudioEncoderLayer.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FunAudioChatAudioEncoderLayer.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoderLayer.self_attn_layer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoderLayer.dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoderLayer.activation_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoderLayer.activation_dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoderLayer.fc1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoderLayer.fc2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoderLayer.final_layer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 5, "n_any": 1, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.funaudiochat.FunAudioChatMultiModalProcessor", "methods": [ { "kind": "function", "name": "FunAudioChatMultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FunAudioChatMultiModalProcessor._hf_processor_applies_updates", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FunAudioChatMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FunAudioChatMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 17, "n_typed": 17, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 13, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.funaudiochat", "names": [ "vllm.model_executor.models.funaudiochat.FunAudioChatAudioAttention", "vllm.model_executor.models.funaudiochat.FunAudioChatAudioEncoder", "vllm.model_executor.models.funaudiochat.FunAudioChatAudioEncoderLayer", "vllm.model_executor.models.funaudiochat.FunAudioChatDiscreteEncoder", "vllm.model_executor.models.funaudiochat.FunAudioChatDummyInputsBuilder", "vllm.model_executor.models.funaudiochat.FunAudioChatForConditionalGeneration", "vllm.model_executor.models.funaudiochat.FunAudioChatMultiModalProcessor", "vllm.model_executor.models.funaudiochat.FunAudioChatProcessingInfo" ], "n_typable": 154, "n_typed": 91, "n_any": 4, "n_untyped": 59, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 33, "n_method_overloads": 33, "n_method_params": 64, "n_classes": 8, "n_attrs": 54, "n_properties": 3, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/fuyu.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.fuyu.FuyuProcessingInfo", "methods": [ { "kind": "function", "name": "FuyuProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FuyuProcessingInfo.get_hf_processor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FuyuProcessingInfo.get_image_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FuyuProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FuyuProcessingInfo.get_image_feature_grid_size", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FuyuProcessingInfo.get_num_image_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FuyuProcessingInfo.get_image_size_with_most_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 13, "n_typed": 11, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 6, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.fuyu.FuyuDummyInputsBuilder", "methods": [ { "kind": "function", "name": "FuyuDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FuyuDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.fuyu.FuyuImagePatchInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "FuyuImagePatchInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FuyuImagePatchInputs.image_patches_flat", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FuyuImagePatchInputs.patches_per_image", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.fuyu.FuyuMultiModalProcessor", "methods": [ { "kind": "function", "name": "FuyuMultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FuyuMultiModalProcessor._apply_hf_processor_tokens_only", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FuyuMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FuyuMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 14, "n_typed": 14, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 10, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.fuyu.FuyuForCausalLM", "methods": [ { "kind": "function", "name": "FuyuForCausalLM.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FuyuForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FuyuForCausalLM._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FuyuForCausalLM._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FuyuForCausalLM.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FuyuForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "FuyuForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FuyuForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FuyuForCausalLM.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FuyuForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FuyuForCausalLM.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FuyuForCausalLM.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FuyuForCausalLM.image_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FuyuForCausalLM.image_feature_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FuyuForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FuyuForCausalLM.vision_embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FuyuForCausalLM.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 31, "n_typed": 20, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 14, "n_attrs": 9, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.fuyu", "names": [ "vllm.model_executor.models.fuyu.FuyuDummyInputsBuilder", "vllm.model_executor.models.fuyu.FuyuForCausalLM", "vllm.model_executor.models.fuyu.FuyuImagePatchInputs", "vllm.model_executor.models.fuyu.FuyuMultiModalProcessor", "vllm.model_executor.models.fuyu.FuyuProcessingInfo" ], "n_typable": 67, "n_typed": 54, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 21, "n_method_overloads": 21, "n_method_params": 34, "n_classes": 5, "n_attrs": 12, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/gemma.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.gemma.GemmaForCausalLM", "methods": [ { "kind": "function", "name": "GemmaForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GemmaForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GemmaForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GemmaForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GemmaForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GemmaForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GemmaForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GemmaForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GemmaForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GemmaForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GemmaForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 13, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gemma.GemmaDecoderLayer", "methods": [ { "kind": "function", "name": "GemmaDecoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GemmaDecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GemmaDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GemmaDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GemmaDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GemmaDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GemmaDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 9, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gemma.GemmaMLP", "methods": [ { "kind": "function", "name": "GemmaMLP.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "GemmaMLP.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GemmaMLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GemmaMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GemmaMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gemma.GemmaModel", "methods": [ { "kind": "function", "name": "GemmaModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GemmaModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GemmaModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GemmaModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GemmaModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GemmaModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GemmaModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GemmaModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 11, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gemma.GemmaAttention", "methods": [ { "kind": "function", "name": "GemmaAttention.__init__", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "GemmaAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GemmaAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GemmaAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GemmaAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GemmaAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GemmaAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GemmaAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GemmaAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GemmaAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GemmaAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GemmaAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GemmaAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GemmaAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GemmaAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 26, "n_typed": 13, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 11, "n_attrs": 13, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.gemma.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.models.gemma", "names": [ "vllm.model_executor.models.gemma.GemmaAttention", "vllm.model_executor.models.gemma.GemmaDecoderLayer", "vllm.model_executor.models.gemma.GemmaForCausalLM", "vllm.model_executor.models.gemma.GemmaMLP", "vllm.model_executor.models.gemma.GemmaModel", "vllm.model_executor.models.gemma.logger" ], "n_typable": 88, "n_typed": 53, "n_any": 0, "n_untyped": 35, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 42, "n_classes": 5, "n_attrs": 32, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/gemma2.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.gemma2.Gemma2Attention", "methods": [ { "kind": "function", "name": "Gemma2Attention.__init__", "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "Gemma2Attention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Gemma2Attention.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma2Attention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma2Attention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma2Attention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma2Attention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma2Attention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma2Attention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma2Attention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma2Attention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma2Attention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma2Attention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma2Attention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma2Attention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma2Attention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 28, "n_typed": 14, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 12, "n_attrs": 14, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gemma2.Gemma2MLP", "methods": [ { "kind": "function", "name": "Gemma2MLP.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Gemma2MLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Gemma2MLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma2MLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma2MLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 9, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gemma2.Gemma2Model", "methods": [ { "kind": "function", "name": "Gemma2Model.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Gemma2Model.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Gemma2Model.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Gemma2Model.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Gemma2Model.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma2Model.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma2Model.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma2Model.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma2Model.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 11, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gemma2.Gemma2DecoderLayer", "methods": [ { "kind": "function", "name": "Gemma2DecoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Gemma2DecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Gemma2DecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma2DecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma2DecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma2DecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma2DecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma2DecoderLayer.pre_feedforward_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma2DecoderLayer.post_feedforward_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 9, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 7, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.gemma2.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.gemma2.Gemma2ForCausalLM", "methods": [ { "kind": "function", "name": "Gemma2ForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Gemma2ForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Gemma2ForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Gemma2ForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Gemma2ForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Gemma2ForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Gemma2ForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma2ForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma2ForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma2ForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma2ForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 13, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.gemma2", "names": [ "vllm.model_executor.models.gemma2.Gemma2Attention", "vllm.model_executor.models.gemma2.Gemma2DecoderLayer", "vllm.model_executor.models.gemma2.Gemma2ForCausalLM", "vllm.model_executor.models.gemma2.Gemma2MLP", "vllm.model_executor.models.gemma2.Gemma2Model", "vllm.model_executor.models.gemma2.logger" ], "n_typable": 93, "n_typed": 56, "n_any": 0, "n_untyped": 37, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 43, "n_classes": 5, "n_attrs": 36, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/gemma3.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.gemma3.Gemma3DecoderLayer", "methods": [ { "kind": "function", "name": "Gemma3DecoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Gemma3DecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Gemma3DecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3DecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3DecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3DecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3DecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3DecoderLayer.pre_feedforward_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3DecoderLayer.post_feedforward_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 9, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gemma3.Gemma3MLP", "methods": [ { "kind": "function", "name": "Gemma3MLP.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Gemma3MLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Gemma3MLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3MLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3MLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 8, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gemma3.Gemma3Attention", "methods": [ { "kind": "function", "name": "Gemma3Attention.__init__", "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "Gemma3Attention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Gemma3Attention.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3Attention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3Attention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3Attention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3Attention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3Attention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3Attention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3Attention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3Attention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3Attention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3Attention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3Attention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3Attention.q_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3Attention.k_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3Attention.is_sliding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3Attention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3Attention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 32, "n_typed": 14, "n_any": 0, "n_untyped": 18, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 13, "n_attrs": 17, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gemma3.Gemma3Model", "methods": [ { "kind": "function", "name": "Gemma3Model.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Gemma3Model.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Gemma3Model.forward", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Gemma3Model.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Gemma3Model.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3Model.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3Model.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3Model.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3Model.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 11, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 9, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gemma3.Gemma3ForCausalLM", "methods": [ { "kind": "function", "name": "Gemma3ForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Gemma3ForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Gemma3ForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Gemma3ForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Gemma3ForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Gemma3ForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Gemma3ForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3ForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3ForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3ForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3ForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3ForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 13, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 10, "n_attrs": 7, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.gemma3.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.models.gemma3", "names": [ "vllm.model_executor.models.gemma3.Gemma3Attention", "vllm.model_executor.models.gemma3.Gemma3DecoderLayer", "vllm.model_executor.models.gemma3.Gemma3ForCausalLM", "vllm.model_executor.models.gemma3.Gemma3MLP", "vllm.model_executor.models.gemma3.Gemma3Model", "vllm.model_executor.models.gemma3.logger" ], "n_typable": 100, "n_typed": 55, "n_any": 0, "n_untyped": 45, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 46, "n_classes": 5, "n_attrs": 40, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/gemma3_mm.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.models.gemma3_mm.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.gemma3_mm.Gemma3MultiModalProjector", "methods": [ { "kind": "function", "name": "Gemma3MultiModalProjector.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Gemma3MultiModalProjector.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Gemma3MultiModalProjector.mm_input_projection_weight", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3MultiModalProjector.mm_soft_emb_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3MultiModalProjector.patches_per_image", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3MultiModalProjector.tokens_per_side", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3MultiModalProjector.kernel_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3MultiModalProjector.avg_pool", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 2, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gemma3_mm.Gemma3DummyInputsBuilder", "methods": [ { "kind": "function", "name": "Gemma3DummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Gemma3DummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gemma3_mm.Gemma3ProcessingInfo", "methods": [ { "kind": "function", "name": "Gemma3ProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Gemma3ProcessingInfo.get_hf_processor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Gemma3ProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Gemma3ProcessingInfo.get_num_crops", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Gemma3ProcessingInfo.get_image_repl", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Gemma3ProcessingInfo.get_num_image_tokens", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Gemma3ProcessingInfo.get_image_size_with_most_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 20, "n_typed": 18, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 13, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gemma3_mm.Gemma3ForConditionalGeneration", "methods": [ { "kind": "function", "name": "Gemma3ForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Gemma3ForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Gemma3ForConditionalGeneration._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Gemma3ForConditionalGeneration._image_pixels_to_features", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Gemma3ForConditionalGeneration._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Gemma3ForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Gemma3ForConditionalGeneration.embed_input_ids", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Gemma3ForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Gemma3ForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Gemma3ForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Gemma3ForConditionalGeneration.get_mm_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Gemma3ForConditionalGeneration.get_num_mm_encoder_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Gemma3ForConditionalGeneration.get_num_mm_connector_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "Gemma3ForConditionalGeneration.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "Gemma3ForConditionalGeneration.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Gemma3ForConditionalGeneration.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3ForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3ForConditionalGeneration.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3ForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3ForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3ForConditionalGeneration.vision_tower", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3ForConditionalGeneration.multi_modal_projector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3ForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 44, "n_typed": 34, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 22, "n_attrs": 9, "n_properties": 1 }, { "kind": "class", "name": "vllm.model_executor.models.gemma3_mm.Gemma3MultiModalProcessor", "methods": [ { "kind": "function", "name": "Gemma3MultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Gemma3MultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Gemma3MultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Gemma3MultiModalProcessor._apply_token_matches", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Gemma3MultiModalProcessor._find_mm_placeholders", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 18, "n_typed": 18, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 13, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gemma3_mm.Gemma3ImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Gemma3ImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3ImagePixelInputs.pixel_values", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3ImagePixelInputs.num_patches", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.gemma3_mm", "names": [ "vllm.model_executor.models.gemma3_mm.Gemma3DummyInputsBuilder", "vllm.model_executor.models.gemma3_mm.Gemma3ForConditionalGeneration", "vllm.model_executor.models.gemma3_mm.Gemma3ImagePixelInputs", "vllm.model_executor.models.gemma3_mm.Gemma3MultiModalProcessor", "vllm.model_executor.models.gemma3_mm.Gemma3MultiModalProjector", "vllm.model_executor.models.gemma3_mm.Gemma3ProcessingInfo", "vllm.model_executor.models.gemma3_mm.logger" ], "n_typable": 102, "n_typed": 81, "n_any": 0, "n_untyped": 21, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 29, "n_method_overloads": 29, "n_method_params": 54, "n_classes": 6, "n_attrs": 19, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/gemma3n.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.gemma3n.Gemma3nMLP", "methods": [ { "kind": "function", "name": "Gemma3nMLP.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Gemma3nMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Gemma3nMLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 9, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.gemma3n.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.models.gemma3n.EPS", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.gemma3n.Gemma3nSelfDecoder", "methods": [ { "kind": "function", "name": "Gemma3nSelfDecoder.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Gemma3nSelfDecoder.get_per_layer_input_embeddings", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Gemma3nSelfDecoder.get_per_layer_inputs", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Gemma3nSelfDecoder.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Gemma3nSelfDecoder.altup_embed", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Gemma3nSelfDecoder.forward", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Gemma3nSelfDecoder.decoder_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nSelfDecoder.layer_idx_start", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nSelfDecoder.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nSelfDecoder.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nSelfDecoder.embed_scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nSelfDecoder.embed_tokens_per_layer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nSelfDecoder.embed_scale_per_layer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nSelfDecoder.per_layer_model_projection", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nSelfDecoder.per_layer_projection_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nSelfDecoder.per_layer_input_scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nSelfDecoder.per_layer_projection_scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nSelfDecoder.altup_projections", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 32, "n_typed": 18, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 14, "n_attrs": 12, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gemma3n.Gemma3nLaurelBlock", "methods": [ { "kind": "function", "name": "Gemma3nLaurelBlock.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Gemma3nLaurelBlock.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Gemma3nLaurelBlock.linear_left", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nLaurelBlock.linear_right", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nLaurelBlock.post_laurel_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 8, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gemma3n.Gemma3nAltUp", "methods": [ { "kind": "function", "name": "Gemma3nAltUp.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "Gemma3nAltUp._compute_router_modalities", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Gemma3nAltUp.scale_corrected_output", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Gemma3nAltUp.predict", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Gemma3nAltUp.correct", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Gemma3nAltUp.altup_num_inputs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nAltUp.altup_active_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nAltUp.altup_coef_clip", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nAltUp.correction_coefs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nAltUp.prediction_coefs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nAltUp.modality_router", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nAltUp.router_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nAltUp.router_input_scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nAltUp.correct_output_scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 26, "n_typed": 16, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 12, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gemma3n.Gemma3nAttention", "methods": [ { "kind": "function", "name": "Gemma3nAttention.__init__", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "Gemma3nAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Gemma3nAttention.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nAttention.q_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nAttention.k_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nAttention.v_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nAttention.sliding_window", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nAttention.is_kv_shared", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 32, "n_typed": 13, "n_any": 0, "n_untyped": 19, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 12, "n_attrs": 18, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gemma3n.Gemma3nTextModel", "methods": [ { "kind": "function", "name": "Gemma3nTextModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Gemma3nTextModel.get_per_layer_input_embeddings", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Gemma3nTextModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Gemma3nTextModel.fast_prefill_forward", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Gemma3nTextModel.normal_forward", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Gemma3nTextModel.altup_unembed", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Gemma3nTextModel.forward", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Gemma3nTextModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "Gemma3nTextModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "Gemma3nTextModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nTextModel.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nTextModel.altup_unembed_projections", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nTextModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nTextModel.fast_prefill_enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nTextModel.self_decoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nTextModel.cross_decoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nTextModel.positions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nTextModel.hidden_states", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nTextModel.per_layer_inputs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 41, "n_typed": 26, "n_any": 0, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 22, "n_attrs": 10, "n_properties": 1 }, { "kind": "class", "name": "vllm.model_executor.models.gemma3n.Gemma3nForCausalLM", "methods": [ { "kind": "function", "name": "Gemma3nForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Gemma3nForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Gemma3nForCausalLM.forward", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Gemma3nForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Gemma3nForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Gemma3nForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Gemma3nForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nForCausalLM.cache_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 14, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 11, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gemma3n.Gemma3nCrossDecoder", "methods": [ { "kind": "function", "name": "Gemma3nCrossDecoder.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Gemma3nCrossDecoder.forward", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Gemma3nCrossDecoder.decoder_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nCrossDecoder.layer_idx_start", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 8, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gemma3n.Gemma3nDecoderLayer", "methods": [ { "kind": "function", "name": "Gemma3nDecoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Gemma3nDecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Gemma3nDecoderLayer.altup_active_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nDecoderLayer.altup", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nDecoderLayer.laurel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nDecoderLayer.per_layer_input_gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nDecoderLayer.per_layer_projection", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nDecoderLayer.pre_feedforward_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nDecoderLayer.post_feedforward_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nDecoderLayer.post_per_layer_input_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nDecoderLayer.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 23, "n_typed": 9, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 13, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.gemma3n", "names": [ "vllm.model_executor.models.gemma3n.EPS", "vllm.model_executor.models.gemma3n.Gemma3nAltUp", "vllm.model_executor.models.gemma3n.Gemma3nAttention", "vllm.model_executor.models.gemma3n.Gemma3nCrossDecoder", "vllm.model_executor.models.gemma3n.Gemma3nDecoderLayer", "vllm.model_executor.models.gemma3n.Gemma3nForCausalLM", "vllm.model_executor.models.gemma3n.Gemma3nLaurelBlock", "vllm.model_executor.models.gemma3n.Gemma3nMLP", "vllm.model_executor.models.gemma3n.Gemma3nSelfDecoder", "vllm.model_executor.models.gemma3n.Gemma3nTextModel", "vllm.model_executor.models.gemma3n.logger" ], "n_typable": 211, "n_typed": 121, "n_any": 0, "n_untyped": 90, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 34, "n_method_overloads": 34, "n_method_params": 100, "n_classes": 9, "n_attrs": 77, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/gemma3n_audio_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.models.gemma3n_audio_utils.adjust_audio_features_to_expected_length", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [], "name": "vllm.model_executor.models.gemma3n_audio_utils", "names": [ "vllm.model_executor.models.gemma3n_audio_utils.adjust_audio_features_to_expected_length" ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 3, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/gemma3n_mm.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.models.gemma3n_mm.TOKENS_PER_AUDIO", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gemma3n_mm.Gemma3nMultimodalEmbedder", "methods": [ { "kind": "function", "name": "Gemma3nMultimodalEmbedder.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Gemma3nMultimodalEmbedder.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Gemma3nMultimodalEmbedder.multimodal_hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nMultimodalEmbedder.eps", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nMultimodalEmbedder.vocab_offset", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nMultimodalEmbedder.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nMultimodalEmbedder.text_hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nMultimodalEmbedder.embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nMultimodalEmbedder.hard_embedding_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nMultimodalEmbedder.soft_embedding_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nMultimodalEmbedder.embedding_projection", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nMultimodalEmbedder.embedding_post_projection_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 5, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 10, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gemma3n_mm.Gemma3nAudioInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Gemma3nAudioInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nAudioInputs.input_features_padded", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nAudioInputs.input_features_mask", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.gemma3n_mm.TOKENS_PER_IMAGE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gemma3n_mm.Gemma3nMultiModalProcessor", "methods": [ { "kind": "function", "name": "Gemma3nMultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Gemma3nMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Gemma3nMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Gemma3nMultiModalProcessor._apply_token_matches", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Gemma3nMultiModalProcessor._find_mm_placeholders", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 18, "n_typed": 18, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 13, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gemma3n_mm.Gemma3nForConditionalGeneration", "methods": [ { "kind": "function", "name": "Gemma3nForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Gemma3nForConditionalGeneration._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Gemma3nForConditionalGeneration._parse_and_validate_audio_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Gemma3nForConditionalGeneration._parse_and_validate_multimodal_inputs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Gemma3nForConditionalGeneration._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Gemma3nForConditionalGeneration._process_audio_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Gemma3nForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Gemma3nForConditionalGeneration.embed_input_ids", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Gemma3nForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Gemma3nForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Gemma3nForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Gemma3nForConditionalGeneration.get_mm_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Gemma3nForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Gemma3nForConditionalGeneration.get_generation_prompt", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "Gemma3nForConditionalGeneration.get_speech_to_text_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Gemma3nForConditionalGeneration.supported_languages", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Gemma3nForConditionalGeneration.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Gemma3nForConditionalGeneration.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nForConditionalGeneration.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nForConditionalGeneration.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nForConditionalGeneration.vision_tower", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nForConditionalGeneration.embed_vision", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nForConditionalGeneration.audio_tower", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nForConditionalGeneration.embed_audio", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nForConditionalGeneration.language_model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nForConditionalGeneration.per_layer_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 56, "n_typed": 45, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 30, "n_attrs": 13, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gemma3n_mm.Gemma3nImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Gemma3nImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Gemma3nImagePixelInputs.pixel_values", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gemma3n_mm.Gemma3nProcessingInfo", "methods": [ { "kind": "function", "name": "Gemma3nProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Gemma3nProcessingInfo.get_hf_processor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Gemma3nProcessingInfo.get_feature_extractor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Gemma3nProcessingInfo.get_data_parser", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Gemma3nProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Gemma3nProcessingInfo.get_max_tokens_per_item", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Gemma3nProcessingInfo.get_image_repl", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Gemma3nProcessingInfo.get_audio_repl", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 16, "n_typed": 13, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 8, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.gemma3n_mm.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.gemma3n_mm.Gemma3nDummyInputsBuilder", "methods": [ { "kind": "function", "name": "Gemma3nDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Gemma3nDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.gemma3n_mm", "names": [ "vllm.model_executor.models.gemma3n_mm.Gemma3nAudioInputs", "vllm.model_executor.models.gemma3n_mm.Gemma3nDummyInputsBuilder", "vllm.model_executor.models.gemma3n_mm.Gemma3nForConditionalGeneration", "vllm.model_executor.models.gemma3n_mm.Gemma3nImagePixelInputs", "vllm.model_executor.models.gemma3n_mm.Gemma3nMultiModalProcessor", "vllm.model_executor.models.gemma3n_mm.Gemma3nMultimodalEmbedder", "vllm.model_executor.models.gemma3n_mm.Gemma3nProcessingInfo", "vllm.model_executor.models.gemma3n_mm.TOKENS_PER_AUDIO", "vllm.model_executor.models.gemma3n_mm.TOKENS_PER_IMAGE", "vllm.model_executor.models.gemma3n_mm.logger" ], "n_typable": 118, "n_typed": 92, "n_any": 0, "n_untyped": 26, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 32, "n_method_overloads": 32, "n_method_params": 59, "n_classes": 7, "n_attrs": 31, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/glm.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.glm.GlmForCausalLM", "methods": [ { "kind": "function", "name": "GlmForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.glm", "names": [ "vllm.model_executor.models.glm.GlmForCausalLM" ], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/glm4.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.models.glm4.get_spec_layer_idx_from_weight_name", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.models.glm4.Glm4DecoderLayer", "methods": [ { "kind": "function", "name": "Glm4DecoderLayer.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Glm4DecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Glm4DecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4DecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4DecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4DecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4DecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4DecoderLayer.post_self_attn_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4DecoderLayer.post_mlp_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 8, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4.Glm4Attention", "methods": [ { "kind": "function", "name": "Glm4Attention.__init__", "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "Glm4Attention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Glm4Attention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4Attention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4Attention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4Attention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4Attention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4Attention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4Attention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4Attention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4Attention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4Attention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4Attention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4Attention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4Attention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 28, "n_typed": 15, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 13, "n_attrs": 13, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4.Glm4Model", "methods": [ { "kind": "function", "name": "Glm4Model.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Glm4Model.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 5, "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.glm4.ALL_DECODER_LAYER_TYPES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4.Glm4ForCausalLM", "methods": [ { "kind": "function", "name": "Glm4ForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Glm4ForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4ForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Glm4ForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4ForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Glm4ForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Glm4ForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4ForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4ForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4ForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4ForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4ForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 13, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 7, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.glm4", "names": [ "vllm.model_executor.models.glm4.ALL_DECODER_LAYER_TYPES", "vllm.model_executor.models.glm4.Glm4Attention", "vllm.model_executor.models.glm4.Glm4DecoderLayer", "vllm.model_executor.models.glm4.Glm4ForCausalLM", "vllm.model_executor.models.glm4.Glm4Model", "vllm.model_executor.models.glm4.get_spec_layer_idx_from_weight_name" ], "n_typable": 71, "n_typed": 43, "n_any": 0, "n_untyped": 28, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 31, "n_classes": 4, "n_attrs": 28, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/glm4_1v.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.glm4_1v.Glm4vVisionTransformer", "methods": [ { "kind": "function", "name": "Glm4vVisionTransformer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Glm4vVisionTransformer.rot_pos_emb", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4vVisionTransformer.compute_attn_mask_seqlen", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4vVisionTransformer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Glm4vVisionTransformer.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "Glm4vVisionTransformer.dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Glm4vVisionTransformer.device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "Glm4vVisionTransformer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vVisionTransformer.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vVisionTransformer.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vVisionTransformer.spatial_merge_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vVisionTransformer.out_hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vVisionTransformer.patch_embed", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vVisionTransformer.rotary_pos_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vVisionTransformer.blocks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vVisionTransformer.merger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vVisionTransformer.embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vVisionTransformer.post_conv_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vVisionTransformer.downsample", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vVisionTransformer.post_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vVisionTransformer.attn_backend", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 30, "n_typed": 16, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 14, "n_properties": 2 }, { "kind": "class", "name": "vllm.model_executor.models.glm4_1v.Glm4vPatchMerger", "methods": [ { "kind": "function", "name": "Glm4vPatchMerger.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Glm4vPatchMerger.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Glm4vPatchMerger.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vPatchMerger.proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vPatchMerger.post_projection_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vPatchMerger.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vPatchMerger.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vPatchMerger.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vPatchMerger.extra_activation_func", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 7, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 7, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.glm4_1v.all_gather_interleave", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.model_executor.models.glm4_1v.Glm4vVideoPixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Glm4vVideoPixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vVideoPixelInputs.pixel_values_videos", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vVideoPixelInputs.video_grid_thw", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4_1v.Glm4vVideoEmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Glm4vVideoEmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vVideoEmbeddingInputs.video_embeds", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vVideoEmbeddingInputs.video_grid_thw", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4_1v.Glm4vVisionEmbeddings", "methods": [ { "kind": "function", "name": "Glm4vVisionEmbeddings.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4vVisionEmbeddings.forward", "n_typed": 1, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Glm4vVisionEmbeddings.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vVisionEmbeddings.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vVisionEmbeddings.image_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vVisionEmbeddings.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vVisionEmbeddings.num_patches", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vVisionEmbeddings.num_positions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vVisionEmbeddings.position_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 2, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4_1v.Glm4vDummyInputsBuilder", "methods": [ { "kind": "function", "name": "Glm4vDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4vDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Glm4vDummyInputsBuilder._get_dummy_videos", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.glm4_1v.Glm4vVideoInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.glm4_1v.Glm4vImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Glm4vImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vImagePixelInputs.pixel_values", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vImagePixelInputs.image_grid_thw", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4_1v.Glm4vMultiModalProcessor", "methods": [ { "kind": "function", "name": "Glm4vMultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Glm4vMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Glm4vMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4_1v.Glm4vForConditionalGeneration", "methods": [ { "kind": "function", "name": "Glm4vForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Glm4vForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Glm4vForConditionalGeneration._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4vForConditionalGeneration._parse_and_validate_video_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4vForConditionalGeneration._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4vForConditionalGeneration._process_video_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4vForConditionalGeneration._parse_and_validate_multimodal_inputs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4vForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4vForConditionalGeneration.iter_mm_grid_thw", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4vForConditionalGeneration.get_mrope_input_positions", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Glm4vForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Glm4vForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4vForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4vForConditionalGeneration.get_mm_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Glm4vForConditionalGeneration.get_num_mm_encoder_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4vForConditionalGeneration.get_num_mm_connector_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Glm4vForConditionalGeneration.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Glm4vForConditionalGeneration.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vForConditionalGeneration.supports_encoder_tp_data", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Glm4vForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vForConditionalGeneration.use_data_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vForConditionalGeneration.visual", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 45, "n_typed": 37, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 16, "n_method_overloads": 16, "n_method_params": 22, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4_1v.Glm4vVisionAttention", "methods": [ { "kind": "function", "name": "Glm4vVisionAttention.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Glm4vVisionAttention.split_qkv", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4vVisionAttention.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Glm4vVisionAttention.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vVisionAttention.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vVisionAttention.hidden_size_per_attention_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vVisionAttention.num_attention_heads_per_partition", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vVisionAttention.qkv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vVisionAttention.proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vVisionAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vVisionAttention.apply_rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 14, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 11, "n_attrs": 8, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.glm4_1v.Glm4vImageInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.glm4_1v.Glm4vVisionMLP", "methods": [ { "kind": "function", "name": "Glm4vVisionMLP.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Glm4vVisionMLP.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Glm4vVisionMLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vVisionMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vVisionMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 6, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4_1v.Glm4vVisionPatchEmbed", "methods": [ { "kind": "function", "name": "Glm4vVisionPatchEmbed.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Glm4vVisionPatchEmbed.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Glm4vVisionPatchEmbed.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vVisionPatchEmbed.temporal_patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vVisionPatchEmbed.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vVisionPatchEmbed.proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 7, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4_1v.Glm4vMoeForConditionalGeneration", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Glm4vMoeForConditionalGeneration.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4_1v.Glm4vProcessingInfo", "methods": [ { "kind": "function", "name": "Glm4vProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Glm4vProcessingInfo.get_image_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4vProcessingInfo.get_video_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4vProcessingInfo.get_data_parser", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Glm4vProcessingInfo._get_vision_info", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Glm4vProcessingInfo._get_image_max_pixels", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Glm4vProcessingInfo.get_image_size_with_most_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Glm4vProcessingInfo.get_num_image_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Glm4vProcessingInfo.get_max_image_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Glm4vProcessingInfo.get_num_video_tokens", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Glm4vProcessingInfo._get_max_video_frames", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4vProcessingInfo.get_num_frames_with_most_features", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Glm4vProcessingInfo._get_video_second_idx_glm4v", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Glm4vProcessingInfo._get_video_second_idx_glm46v", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Glm4vProcessingInfo._construct_video_placeholder", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 37, "n_typed": 36, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 22, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4_1v.Glm4vVisionBlock", "methods": [ { "kind": "function", "name": "Glm4vVisionBlock.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Glm4vVisionBlock.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Glm4vVisionBlock.norm1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vVisionBlock.norm2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vVisionBlock.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vVisionBlock.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 13, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 11, "n_attrs": 4, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.glm4_1v.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.glm4_1v.Glm4vImageEmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Glm4vImageEmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vImageEmbeddingInputs.image_embeds", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Glm4vImageEmbeddingInputs.image_grid_thw", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.glm4_1v", "names": [ "vllm.model_executor.models.glm4_1v.Glm4vDummyInputsBuilder", "vllm.model_executor.models.glm4_1v.Glm4vForConditionalGeneration", "vllm.model_executor.models.glm4_1v.Glm4vImageEmbeddingInputs", "vllm.model_executor.models.glm4_1v.Glm4vImageInputs", "vllm.model_executor.models.glm4_1v.Glm4vImagePixelInputs", "vllm.model_executor.models.glm4_1v.Glm4vMoeForConditionalGeneration", "vllm.model_executor.models.glm4_1v.Glm4vMultiModalProcessor", "vllm.model_executor.models.glm4_1v.Glm4vPatchMerger", "vllm.model_executor.models.glm4_1v.Glm4vProcessingInfo", "vllm.model_executor.models.glm4_1v.Glm4vVideoEmbeddingInputs", "vllm.model_executor.models.glm4_1v.Glm4vVideoInputs", "vllm.model_executor.models.glm4_1v.Glm4vVideoPixelInputs", "vllm.model_executor.models.glm4_1v.Glm4vVisionAttention", "vllm.model_executor.models.glm4_1v.Glm4vVisionBlock", "vllm.model_executor.models.glm4_1v.Glm4vVisionEmbeddings", "vllm.model_executor.models.glm4_1v.Glm4vVisionMLP", "vllm.model_executor.models.glm4_1v.Glm4vVisionPatchEmbed", "vllm.model_executor.models.glm4_1v.Glm4vVisionTransformer", "vllm.model_executor.models.glm4_1v.all_gather_interleave", "vllm.model_executor.models.glm4_1v.logger" ], "n_typable": 246, "n_typed": 178, "n_any": 0, "n_untyped": 68, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 3, "n_methods": 55, "n_method_overloads": 55, "n_method_params": 116, "n_classes": 16, "n_attrs": 72, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/glm4_moe.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.glm4_moe.Glm4MoeForCausalLM", "methods": [ { "kind": "function", "name": "Glm4MoeForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Glm4MoeForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4MoeForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Glm4MoeForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4MoeForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4MoeForCausalLM.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Glm4MoeForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Glm4MoeForCausalLM.fall_back_to_pt_during_load", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Glm4MoeForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeForCausalLM.expert_weights", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeForCausalLM.num_moe_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeForCausalLM.num_expert_groups", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeForCausalLM.moe_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeForCausalLM.moe_mlp_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 26, "n_typed": 15, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 9, "n_attrs": 13, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.glm4_moe.get_spec_layer_idx_from_weight_name", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.models.glm4_moe.Glm4MixtureOfExperts", "methods": [ { "kind": "function", "name": "Glm4MixtureOfExperts.extract_moe_parameters", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4MixtureOfExperts.update_physical_experts_metadata", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4_moe.Glm4MoeMLP", "methods": [ { "kind": "function", "name": "Glm4MoeMLP.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Glm4MoeMLP.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Glm4MoeMLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4_moe.Glm4MoE", "methods": [ { "kind": "function", "name": "Glm4MoE.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Glm4MoE.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Glm4MoE.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoE.routed_scaling_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoE.ep_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoE.ep_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoE.ep_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoE.n_routed_experts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoE.n_shared_experts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoE.gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoE.enable_eplb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoE.n_redundant_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoE.n_logical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoE.n_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoE.n_local_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoE.physical_expert_start", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoE.physical_expert_end", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoE.experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoE.shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 24, "n_typed": 8, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 17, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4_moe.Glm4MoeDecoderLayer", "methods": [ { "kind": "function", "name": "Glm4MoeDecoderLayer.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Glm4MoeDecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Glm4MoeDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeDecoderLayer.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeDecoderLayer.routed_scaling_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 10, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4_moe.Glm4MoeAttention", "methods": [ { "kind": "function", "name": "Glm4MoeAttention.__init__", "n_typed": 13, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 }, { "kind": "function", "name": "Glm4MoeAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Glm4MoeAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeAttention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeAttention.use_qk_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeAttention.q_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeAttention.k_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 33, "n_typed": 16, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 14, "n_attrs": 17, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4_moe.Glm4MoeModel", "methods": [ { "kind": "function", "name": "Glm4MoeModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Glm4MoeModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4MoeModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Glm4MoeModel.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Glm4MoeModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Glm4MoeModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 12, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 8, "n_attrs": 5, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.glm4_moe.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.models.glm4_moe", "names": [ "vllm.model_executor.models.glm4_moe.Glm4MixtureOfExperts", "vllm.model_executor.models.glm4_moe.Glm4MoE", "vllm.model_executor.models.glm4_moe.Glm4MoeAttention", "vllm.model_executor.models.glm4_moe.Glm4MoeDecoderLayer", "vllm.model_executor.models.glm4_moe.Glm4MoeForCausalLM", "vllm.model_executor.models.glm4_moe.Glm4MoeMLP", "vllm.model_executor.models.glm4_moe.Glm4MoeModel", "vllm.model_executor.models.glm4_moe.get_spec_layer_idx_from_weight_name", "vllm.model_executor.models.glm4_moe.logger" ], "n_typable": 139, "n_typed": 76, "n_any": 0, "n_untyped": 63, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 21, "n_method_overloads": 21, "n_method_params": 54, "n_classes": 7, "n_attrs": 63, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/glm4_moe_lite.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.glm4_moe_lite.Glm4MoeLite", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.glm4_moe_lite.get_spec_layer_idx_from_weight_name", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.models.glm4_moe_lite.Glm4MoeLiteDecoderLayer", "methods": [ { "kind": "function", "name": "Glm4MoeLiteDecoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Glm4MoeLiteDecoderLayer.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Glm4MoeLiteDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeLiteDecoderLayer.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeLiteDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeLiteDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeLiteDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeLiteDecoderLayer.routed_scaling_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeLiteDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 10, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4_moe_lite.Glm4MoeLiteMLAAttention", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4_moe_lite.Glm4MoeLiteMLP", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4_moe_lite.Glm4LiteMixtureOfExperts", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4_moe_lite.Glm4MoeLiteForCausalLM", "methods": [ { "kind": "function", "name": "Glm4MoeLiteForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Glm4MoeLiteForCausalLM.set_moe_parameters", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Glm4MoeLiteForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4MoeLiteForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Glm4MoeLiteForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4MoeLiteForCausalLM.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Glm4MoeLiteForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Glm4MoeLiteForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Glm4MoeLiteForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeLiteForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeLiteForCausalLM.use_mha", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeLiteForCausalLM.fuse_qkv_a_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeLiteForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeLiteForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeLiteForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeLiteForCausalLM.num_moe_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeLiteForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 25, "n_typed": 14, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 9, "n_attrs": 10, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.glm4_moe_lite.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.glm4_moe_lite.Glm4MoeLiteAttention", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4_moe_lite.Glm4MoeLiteModel", "methods": [ { "kind": "function", "name": "Glm4MoeLiteModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Glm4MoeLiteModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4MoeLiteModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Glm4MoeLiteModel.make_empty_intermediate_tensors", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Glm4MoeLiteModel.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Glm4MoeLiteModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Glm4MoeLiteModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeLiteModel.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeLiteModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeLiteModel.is_v32", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeLiteModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeLiteModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeLiteModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 24, "n_typed": 16, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 11, "n_attrs": 7, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.glm4_moe_lite", "names": [ "vllm.model_executor.models.glm4_moe_lite.Glm4LiteMixtureOfExperts", "vllm.model_executor.models.glm4_moe_lite.Glm4MoeLite", "vllm.model_executor.models.glm4_moe_lite.Glm4MoeLiteAttention", "vllm.model_executor.models.glm4_moe_lite.Glm4MoeLiteDecoderLayer", "vllm.model_executor.models.glm4_moe_lite.Glm4MoeLiteForCausalLM", "vllm.model_executor.models.glm4_moe_lite.Glm4MoeLiteMLAAttention", "vllm.model_executor.models.glm4_moe_lite.Glm4MoeLiteMLP", "vllm.model_executor.models.glm4_moe_lite.Glm4MoeLiteModel", "vllm.model_executor.models.glm4_moe_lite.get_spec_layer_idx_from_weight_name", "vllm.model_executor.models.glm4_moe_lite.logger" ], "n_typable": 70, "n_typed": 43, "n_any": 0, "n_untyped": 27, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 28, "n_classes": 8, "n_attrs": 25, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/glm4_moe_lite_mtp.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.glm4_moe_lite_mtp.SharedHead", "methods": [ { "kind": "function", "name": "SharedHead.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SharedHead.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SharedHead.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SharedHead.head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4_moe_lite_mtp.Glm4MoeLiteMultiTokenPredictor", "methods": [ { "kind": "function", "name": "Glm4MoeLiteMultiTokenPredictor.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Glm4MoeLiteMultiTokenPredictor.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4MoeLiteMultiTokenPredictor.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Glm4MoeLiteMultiTokenPredictor.compute_logits", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Glm4MoeLiteMultiTokenPredictor.mtp_start_layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeLiteMultiTokenPredictor.num_mtp_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeLiteMultiTokenPredictor.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeLiteMultiTokenPredictor.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeLiteMultiTokenPredictor.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 13, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 10, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4_moe_lite_mtp.Glm4MoeLiteMTP", "methods": [ { "kind": "function", "name": "Glm4MoeLiteMTP.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Glm4MoeLiteMTP.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4MoeLiteMTP.forward", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Glm4MoeLiteMTP.compute_logits", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Glm4MoeLiteMTP.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4MoeLiteMTP._rewrite_spec_layer_name", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Glm4MoeLiteMTP.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeLiteMTP.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeLiteMTP.expert_weights", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeLiteMTP.num_moe_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeLiteMTP.num_expert_groups", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeLiteMTP.moe_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeLiteMTP.moe_mlp_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 27, "n_typed": 21, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 14, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4_moe_lite_mtp.Glm4MoeLiteMultiTokenPredictorLayer", "methods": [ { "kind": "function", "name": "Glm4MoeLiteMultiTokenPredictorLayer.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Glm4MoeLiteMultiTokenPredictorLayer.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Glm4MoeLiteMultiTokenPredictorLayer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeLiteMultiTokenPredictorLayer.enorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeLiteMultiTokenPredictorLayer.hnorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeLiteMultiTokenPredictorLayer.eh_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeLiteMultiTokenPredictorLayer.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeLiteMultiTokenPredictorLayer.is_v32", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeLiteMultiTokenPredictorLayer.shared_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeLiteMultiTokenPredictorLayer.mtp_block", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 8, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 8, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.glm4_moe_lite_mtp", "names": [ "vllm.model_executor.models.glm4_moe_lite_mtp.Glm4MoeLiteMTP", "vllm.model_executor.models.glm4_moe_lite_mtp.Glm4MoeLiteMultiTokenPredictor", "vllm.model_executor.models.glm4_moe_lite_mtp.Glm4MoeLiteMultiTokenPredictorLayer", "vllm.model_executor.models.glm4_moe_lite_mtp.SharedHead" ], "n_typable": 71, "n_typed": 48, "n_any": 0, "n_untyped": 23, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 35, "n_classes": 4, "n_attrs": 22, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/glm4_moe_mtp.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.glm4_moe_mtp.SharedHead", "methods": [ { "kind": "function", "name": "SharedHead.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SharedHead.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SharedHead.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SharedHead.head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4_moe_mtp.Glm4MoeMultiTokenPredictorLayer", "methods": [ { "kind": "function", "name": "Glm4MoeMultiTokenPredictorLayer.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Glm4MoeMultiTokenPredictorLayer.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Glm4MoeMultiTokenPredictorLayer.enorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeMultiTokenPredictorLayer.hnorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeMultiTokenPredictorLayer.eh_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeMultiTokenPredictorLayer.shared_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeMultiTokenPredictorLayer.enable_eplb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeMultiTokenPredictorLayer.mtp_block", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 12, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 10, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4_moe_mtp.Glm4MoeMultiTokenPredictor", "methods": [ { "kind": "function", "name": "Glm4MoeMultiTokenPredictor.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Glm4MoeMultiTokenPredictor.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4MoeMultiTokenPredictor.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Glm4MoeMultiTokenPredictor.compute_logits", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Glm4MoeMultiTokenPredictor.mtp_start_layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeMultiTokenPredictor.num_mtp_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeMultiTokenPredictor.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeMultiTokenPredictor.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeMultiTokenPredictor.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 13, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 10, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4_moe_mtp.Glm4MoeMTP", "methods": [ { "kind": "function", "name": "Glm4MoeMTP.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Glm4MoeMTP.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4MoeMTP.forward", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Glm4MoeMTP.compute_logits", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Glm4MoeMTP.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4MoeMTP._rewrite_spec_layer_name", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Glm4MoeMTP.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeMTP.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeMTP.expert_weights", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeMTP.num_moe_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeMTP.num_expert_groups", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeMTP.moe_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeMTP.moe_mlp_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 27, "n_typed": 21, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 14, "n_attrs": 7, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.glm4_moe_mtp", "names": [ "vllm.model_executor.models.glm4_moe_mtp.Glm4MoeMTP", "vllm.model_executor.models.glm4_moe_mtp.Glm4MoeMultiTokenPredictor", "vllm.model_executor.models.glm4_moe_mtp.Glm4MoeMultiTokenPredictorLayer", "vllm.model_executor.models.glm4_moe_mtp.SharedHead" ], "n_typable": 72, "n_typed": 52, "n_any": 0, "n_untyped": 20, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 38, "n_classes": 4, "n_attrs": 20, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/glm4v.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.glm4v.GLMVImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "GLMVImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GLMVImagePixelInputs.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4v.EVA2CLIPTransformer", "methods": [ { "kind": "function", "name": "EVA2CLIPTransformer.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "EVA2CLIPTransformer.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EVA2CLIPTransformer.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 2, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4v.GLM4VForCausalLM", "methods": [ { "kind": "function", "name": "GLM4VForCausalLM.get_mm_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GLM4VForCausalLM.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GLM4VForCausalLM.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GLM4VForCausalLM._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GLM4VForCausalLM._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GLM4VForCausalLM.iter_mm_grid_thw", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GLM4VForCausalLM.get_mrope_input_positions", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GLM4VForCausalLM.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GLM4VForCausalLM.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GLM4VForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GLM4VForCausalLM.transformer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GLM4VForCausalLM.embed_input_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 26, "n_typed": 26, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 16, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4v.GLM4VDummyInputsBuilder", "methods": [ { "kind": "function", "name": "GLM4VDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GLM4VDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4v.EVA2CLIPModel", "methods": [ { "kind": "function", "name": "EVA2CLIPModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "EVA2CLIPModel.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EVA2CLIPModel.patch_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EVA2CLIPModel.transformer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EVA2CLIPModel.linear_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EVA2CLIPModel.conv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EVA2CLIPModel.boi", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EVA2CLIPModel.eoi", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EVA2CLIPModel.scaling_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 4, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4v.EVA2CLIPTransformerLayer", "methods": [ { "kind": "function", "name": "EVA2CLIPTransformerLayer.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "EVA2CLIPTransformerLayer.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EVA2CLIPTransformerLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EVA2CLIPTransformerLayer.attention", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EVA2CLIPTransformerLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EVA2CLIPTransformerLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 2, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4v.GLM4VModel", "methods": [ { "kind": "function", "name": "GLM4VModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GLM4VModel.vision", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 4, "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4v.EVA2CLIPPatchEmbedding", "methods": [ { "kind": "function", "name": "EVA2CLIPPatchEmbedding.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EVA2CLIPPatchEmbedding.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EVA2CLIPPatchEmbedding.proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EVA2CLIPPatchEmbedding.cls_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EVA2CLIPPatchEmbedding.position_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 2, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4v.GLM4VProcessingInfo", "methods": [ { "kind": "function", "name": "GLM4VProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GLM4VProcessingInfo.get_hf_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GLM4VProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GLM4VProcessingInfo.get_num_image_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GLM4VProcessingInfo.get_num_image_feature_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4v.EVA2CLIPAttention", "methods": [ { "kind": "function", "name": "EVA2CLIPAttention.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "EVA2CLIPAttention.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EVA2CLIPAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EVA2CLIPAttention.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EVA2CLIPAttention.num_heads_per_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EVA2CLIPAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EVA2CLIPAttention.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EVA2CLIPAttention.query_key_value", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EVA2CLIPAttention.dense", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EVA2CLIPAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EVA2CLIPAttention.output_dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 4, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4v.GLM4VProcessor", "methods": [ { "kind": "function", "name": "GLM4VProcessor.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GLM4VProcessor.__call__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GLM4VProcessor.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GLM4VProcessor.tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GLM4VProcessor.image_transform", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 7, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4v.EVA2CLIPMLP", "methods": [ { "kind": "function", "name": "EVA2CLIPMLP.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "EVA2CLIPMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EVA2CLIPMLP.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EVA2CLIPMLP.activation_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EVA2CLIPMLP.fc1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EVA2CLIPMLP.fc2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 4, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4v.EVA2CLIPGLU", "methods": [ { "kind": "function", "name": "EVA2CLIPGLU.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "EVA2CLIPGLU.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EVA2CLIPGLU.linear_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EVA2CLIPGLU.norm1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EVA2CLIPGLU.act1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EVA2CLIPGLU.act2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EVA2CLIPGLU.merged_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EVA2CLIPGLU.dense_4h_to_h", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 2, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm4v.GLM4VMultiModalProcessor", "methods": [ { "kind": "function", "name": "GLM4VMultiModalProcessor._hf_processor_applies_updates", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GLM4VMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GLM4VMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.glm4v", "names": [ "vllm.model_executor.models.glm4v.EVA2CLIPAttention", "vllm.model_executor.models.glm4v.EVA2CLIPGLU", "vllm.model_executor.models.glm4v.EVA2CLIPMLP", "vllm.model_executor.models.glm4v.EVA2CLIPModel", "vllm.model_executor.models.glm4v.EVA2CLIPPatchEmbedding", "vllm.model_executor.models.glm4v.EVA2CLIPTransformer", "vllm.model_executor.models.glm4v.EVA2CLIPTransformerLayer", "vllm.model_executor.models.glm4v.GLM4VDummyInputsBuilder", "vllm.model_executor.models.glm4v.GLM4VForCausalLM", "vllm.model_executor.models.glm4v.GLM4VModel", "vllm.model_executor.models.glm4v.GLM4VMultiModalProcessor", "vllm.model_executor.models.glm4v.GLM4VProcessingInfo", "vllm.model_executor.models.glm4v.GLM4VProcessor", "vllm.model_executor.models.glm4v.GLMVImagePixelInputs" ], "n_typable": 141, "n_typed": 80, "n_any": 0, "n_untyped": 61, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 36, "n_method_overloads": 36, "n_method_params": 64, "n_classes": 14, "n_attrs": 43, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/glm_ocr.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.glm_ocr.GlmOcrPatchMerger", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm_ocr.GlmOcrVisionPatchEmbed", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm_ocr.GlmOcrVisionBlock", "methods": [ { "kind": "function", "name": "GlmOcrVisionBlock.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GlmOcrVisionBlock.norm1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmOcrVisionBlock.norm2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmOcrVisionBlock.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmOcrVisionBlock.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 7, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 6, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm_ocr.GlmOcrVisionTransformer", "methods": [ { "kind": "function", "name": "GlmOcrVisionTransformer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GlmOcrVisionTransformer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GlmOcrVisionTransformer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmOcrVisionTransformer.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmOcrVisionTransformer.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmOcrVisionTransformer.spatial_merge_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmOcrVisionTransformer.out_hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmOcrVisionTransformer.patch_embed", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmOcrVisionTransformer.rotary_pos_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmOcrVisionTransformer.blocks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmOcrVisionTransformer.merger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmOcrVisionTransformer.downsample", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmOcrVisionTransformer.post_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmOcrVisionTransformer.attn_backend", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 8, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 12, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm_ocr.GlmOcrVisionMLP", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm_ocr.GlmOcrForConditionalGeneration", "methods": [ { "kind": "function", "name": "GlmOcrForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GlmOcrForConditionalGeneration.visual", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 4, "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.glm_ocr.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.glm_ocr.GlmOcrVisionAttention", "methods": [ { "kind": "function", "name": "GlmOcrVisionAttention.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "GlmOcrVisionAttention.split_qkv", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GlmOcrVisionAttention.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GlmOcrVisionAttention.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmOcrVisionAttention.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmOcrVisionAttention.hidden_size_per_attention_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmOcrVisionAttention.num_attention_heads_per_partition", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmOcrVisionAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmOcrVisionAttention.q_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmOcrVisionAttention.k_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmOcrVisionAttention.qkv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmOcrVisionAttention.proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmOcrVisionAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmOcrVisionAttention.apply_rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 25, "n_typed": 14, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 11, "n_attrs": 11, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.glm_ocr", "names": [ "vllm.model_executor.models.glm_ocr.GlmOcrForConditionalGeneration", "vllm.model_executor.models.glm_ocr.GlmOcrPatchMerger", "vllm.model_executor.models.glm_ocr.GlmOcrVisionAttention", "vllm.model_executor.models.glm_ocr.GlmOcrVisionBlock", "vllm.model_executor.models.glm_ocr.GlmOcrVisionMLP", "vllm.model_executor.models.glm_ocr.GlmOcrVisionPatchEmbed", "vllm.model_executor.models.glm_ocr.GlmOcrVisionTransformer", "vllm.model_executor.models.glm_ocr.logger" ], "n_typable": 61, "n_typed": 31, "n_any": 0, "n_untyped": 30, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 25, "n_classes": 7, "n_attrs": 29, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/glm_ocr_mtp.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.glm_ocr_mtp.GlmOcrMTP", "methods": [ { "kind": "function", "name": "GlmOcrMTP.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GlmOcrMTP.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GlmOcrMTP.forward", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "GlmOcrMTP.compute_logits", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GlmOcrMTP.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GlmOcrMTP._rewrite_spec_layer_name", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GlmOcrMTP.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmOcrMTP.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmOcrMTP.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmOcrMTP.expert_weights", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmOcrMTP.num_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 25, "n_typed": 19, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 14, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm_ocr_mtp.GlmOcrMultiTokenPredictorLayer", "methods": [ { "kind": "function", "name": "GlmOcrMultiTokenPredictorLayer.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GlmOcrMultiTokenPredictorLayer.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GlmOcrMultiTokenPredictorLayer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmOcrMultiTokenPredictorLayer.enorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmOcrMultiTokenPredictorLayer.hnorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmOcrMultiTokenPredictorLayer.eh_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmOcrMultiTokenPredictorLayer.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmOcrMultiTokenPredictorLayer.shared_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmOcrMultiTokenPredictorLayer.mtp_block", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 8, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glm_ocr_mtp.GlmOcrMultiTokenPredictor", "methods": [ { "kind": "function", "name": "GlmOcrMultiTokenPredictor.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GlmOcrMultiTokenPredictor.mtp_start_layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmOcrMultiTokenPredictor.num_mtp_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmOcrMultiTokenPredictor.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmOcrMultiTokenPredictor.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmOcrMultiTokenPredictor.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 2, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 5, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.glm_ocr_mtp", "names": [ "vllm.model_executor.models.glm_ocr_mtp.GlmOcrMTP", "vllm.model_executor.models.glm_ocr_mtp.GlmOcrMultiTokenPredictor", "vllm.model_executor.models.glm_ocr_mtp.GlmOcrMultiTokenPredictorLayer" ], "n_typable": 49, "n_typed": 29, "n_any": 0, "n_untyped": 20, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 23, "n_classes": 3, "n_attrs": 17, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/glmasr.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.glmasr.GlmAsrEncoderLayer", "methods": [ { "kind": "function", "name": "GlmAsrEncoderLayer.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GlmAsrEncoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GlmAsrEncoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmAsrEncoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmAsrEncoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmAsrEncoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmAsrEncoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 6, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glmasr.GlmAsrEmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "GlmAsrEmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GlmAsrEmbeddingInputs.audio_embeds", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glmasr.GlmAsrEncoderAttention", "methods": [ { "kind": "function", "name": "GlmAsrEncoderAttention.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GlmAsrEncoderAttention.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GlmAsrEncoderAttention.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmAsrEncoderAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmAsrEncoderAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmAsrEncoderAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmAsrEncoderAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmAsrEncoderAttention.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmAsrEncoderAttention.num_heads_per_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmAsrEncoderAttention.num_kv_heads_per_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmAsrEncoderAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmAsrEncoderAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmAsrEncoderAttention.rotary_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmAsrEncoderAttention.apply_rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmAsrEncoderAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 6, "n_any": 0, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 13, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glmasr.GlmAsrEncoderMLP", "methods": [ { "kind": "function", "name": "GlmAsrEncoderMLP.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GlmAsrEncoderMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GlmAsrEncoderMLP.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmAsrEncoderMLP.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmAsrEncoderMLP.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmAsrEncoderMLP.fc1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmAsrEncoderMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmAsrEncoderMLP.fc2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 4, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glmasr.GlmAsrEncoderRotaryEmbedding", "methods": [ { "kind": "function", "name": "GlmAsrEncoderRotaryEmbedding.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GlmAsrEncoderRotaryEmbedding.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GlmAsrEncoderRotaryEmbedding.dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmAsrEncoderRotaryEmbedding.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmAsrEncoderRotaryEmbedding.attention_scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 3, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glmasr.GlmAsrMultiModalProjector", "methods": [ { "kind": "function", "name": "GlmAsrMultiModalProjector.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GlmAsrMultiModalProjector.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GlmAsrMultiModalProjector.linear_1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmAsrMultiModalProjector.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmAsrMultiModalProjector.linear_2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 5, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.glmasr.GlmAsrInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.glmasr.GlmAsrMultiModalDataParser", "methods": [ { "kind": "function", "name": "GlmAsrMultiModalDataParser._parse_audio_data", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glmasr.GlmAsrForConditionalGeneration", "methods": [ { "kind": "function", "name": "GlmAsrForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GlmAsrForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GlmAsrForConditionalGeneration.get_mm_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GlmAsrForConditionalGeneration._parse_and_validate_audio_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GlmAsrForConditionalGeneration._process_audio_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GlmAsrForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GlmAsrForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "GlmAsrForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GlmAsrForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GlmAsrForConditionalGeneration._get_audio_token", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GlmAsrForConditionalGeneration.get_speech_to_text_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GlmAsrForConditionalGeneration.get_generation_prompt", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GlmAsrForConditionalGeneration.supported_languages", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GlmAsrForConditionalGeneration.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GlmAsrForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmAsrForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmAsrForConditionalGeneration.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmAsrForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmAsrForConditionalGeneration.audio_tower", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmAsrForConditionalGeneration.multi_modal_projector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmAsrForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 43, "n_typed": 35, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 24, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glmasr.GlmAsrFeatureInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "GlmAsrFeatureInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GlmAsrFeatureInputs.input_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GlmAsrFeatureInputs.feature_attention_mask", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GlmAsrFeatureInputs.chunk_counts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glmasr.GlmAsrMultiModalProcessor", "methods": [ { "kind": "function", "name": "GlmAsrMultiModalProcessor._calculate_chunk_counts", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GlmAsrMultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GlmAsrMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GlmAsrMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 16, "n_typed": 16, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 12, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glmasr.GlmAsrProcessingInfo", "methods": [ { "kind": "function", "name": "GlmAsrProcessingInfo.get_hf_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GlmAsrProcessingInfo.get_hf_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GlmAsrProcessingInfo.get_feature_extractor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GlmAsrProcessingInfo.get_data_parser", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GlmAsrProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glmasr.GlmAsrDummyInputsBuilder", "methods": [ { "kind": "function", "name": "GlmAsrDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GlmAsrDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.glmasr.GlmAsrEncoder", "methods": [ { "kind": "function", "name": "GlmAsrEncoder.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GlmAsrEncoder._get_feat_extract_output_lengths", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GlmAsrEncoder.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GlmAsrEncoder.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GlmAsrEncoder.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GlmAsrEncoder.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmAsrEncoder.conv1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmAsrEncoder.conv2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmAsrEncoder.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmAsrEncoder.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GlmAsrEncoder.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 8, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 6, "n_attrs": 7, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.glmasr", "names": [ "vllm.model_executor.models.glmasr.GlmAsrDummyInputsBuilder", "vllm.model_executor.models.glmasr.GlmAsrEmbeddingInputs", "vllm.model_executor.models.glmasr.GlmAsrEncoder", "vllm.model_executor.models.glmasr.GlmAsrEncoderAttention", "vllm.model_executor.models.glmasr.GlmAsrEncoderLayer", "vllm.model_executor.models.glmasr.GlmAsrEncoderMLP", "vllm.model_executor.models.glmasr.GlmAsrEncoderRotaryEmbedding", "vllm.model_executor.models.glmasr.GlmAsrFeatureInputs", "vllm.model_executor.models.glmasr.GlmAsrForConditionalGeneration", "vllm.model_executor.models.glmasr.GlmAsrInputs", "vllm.model_executor.models.glmasr.GlmAsrMultiModalDataParser", "vllm.model_executor.models.glmasr.GlmAsrMultiModalProcessor", "vllm.model_executor.models.glmasr.GlmAsrMultiModalProjector", "vllm.model_executor.models.glmasr.GlmAsrProcessingInfo" ], "n_typable": 159, "n_typed": 104, "n_any": 0, "n_untyped": 55, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 38, "n_method_overloads": 38, "n_method_params": 71, "n_classes": 13, "n_attrs": 53, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/glmasr_utils.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.models.glmasr_utils.DEFAULT_MAX_AUDIO_LEN_S", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.glmasr_utils.DEFAULT_CONV_PARAMS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.glmasr_utils.DEFAULT_MERGE_FACTOR", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.glmasr_utils", "names": [ "vllm.model_executor.models.glmasr_utils.DEFAULT_CONV_PARAMS", "vllm.model_executor.models.glmasr_utils.DEFAULT_MAX_AUDIO_LEN_S", "vllm.model_executor.models.glmasr_utils.DEFAULT_MERGE_FACTOR" ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/gpt2.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.gpt2.GPT2LMHeadModel", "methods": [ { "kind": "function", "name": "GPT2LMHeadModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GPT2LMHeadModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPT2LMHeadModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GPT2LMHeadModel.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPT2LMHeadModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GPT2LMHeadModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPT2LMHeadModel.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPT2LMHeadModel.transformer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPT2LMHeadModel.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPT2LMHeadModel.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPT2LMHeadModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 13, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gpt2.GPT2Block", "methods": [ { "kind": "function", "name": "GPT2Block.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GPT2Block.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GPT2Block.ln_1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPT2Block.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPT2Block.ln_2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPT2Block.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 6, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gpt2.GPT2ForSequenceClassification", "methods": [ { "kind": "function", "name": "GPT2ForSequenceClassification.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GPT2ForSequenceClassification.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPT2ForSequenceClassification.load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPT2ForSequenceClassification.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GPT2ForSequenceClassification.is_pooling_model", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GPT2ForSequenceClassification.transformer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPT2ForSequenceClassification.score", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPT2ForSequenceClassification.pooler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 10, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gpt2.GPT2MLP", "methods": [ { "kind": "function", "name": "GPT2MLP.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GPT2MLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GPT2MLP.c_fc", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPT2MLP.c_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPT2MLP.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 6, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gpt2.GPT2Attention", "methods": [ { "kind": "function", "name": "GPT2Attention.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GPT2Attention.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GPT2Attention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPT2Attention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPT2Attention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPT2Attention.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPT2Attention.c_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPT2Attention.c_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPT2Attention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 6, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gpt2.GPT2Model", "methods": [ { "kind": "function", "name": "GPT2Model.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GPT2Model.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPT2Model.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GPT2Model.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GPT2Model.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPT2Model.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPT2Model.wte", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPT2Model.wpe", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPT2Model.ln_f", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPT2Model.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 11, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.gpt2", "names": [ "vllm.model_executor.models.gpt2.GPT2Attention", "vllm.model_executor.models.gpt2.GPT2Block", "vllm.model_executor.models.gpt2.GPT2ForSequenceClassification", "vllm.model_executor.models.gpt2.GPT2LMHeadModel", "vllm.model_executor.models.gpt2.GPT2MLP", "vllm.model_executor.models.gpt2.GPT2Model" ], "n_typable": 88, "n_typed": 52, "n_any": 0, "n_untyped": 36, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 19, "n_method_overloads": 19, "n_method_params": 40, "n_classes": 6, "n_attrs": 30, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/gpt_bigcode.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.gpt_bigcode.GPTBigMLP", "methods": [ { "kind": "function", "name": "GPTBigMLP.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GPTBigMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GPTBigMLP.c_fc", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTBigMLP.c_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTBigMLP.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 6, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gpt_bigcode.GPTBigCodeForCausalLM", "methods": [ { "kind": "function", "name": "GPTBigCodeForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GPTBigCodeForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPTBigCodeForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GPTBigCodeForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPTBigCodeForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GPTBigCodeForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GPTBigCodeForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTBigCodeForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTBigCodeForCausalLM.transformer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTBigCodeForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTBigCodeForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTBigCodeForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 13, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gpt_bigcode.GPTBigCodeBlock", "methods": [ { "kind": "function", "name": "GPTBigCodeBlock.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GPTBigCodeBlock.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GPTBigCodeBlock.ln_1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTBigCodeBlock.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTBigCodeBlock.ln_2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTBigCodeBlock.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 6, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gpt_bigcode.GPTBigCodeModel", "methods": [ { "kind": "function", "name": "GPTBigCodeModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GPTBigCodeModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPTBigCodeModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GPTBigCodeModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GPTBigCodeModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTBigCodeModel.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTBigCodeModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTBigCodeModel.wte", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTBigCodeModel.wpe", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTBigCodeModel.ln_f", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTBigCodeModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 11, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gpt_bigcode.GPTBigCodeAttention", "methods": [ { "kind": "function", "name": "GPTBigCodeAttention.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GPTBigCodeAttention.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GPTBigCodeAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTBigCodeAttention.tensor_model_parallel_world_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTBigCodeAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTBigCodeAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTBigCodeAttention.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTBigCodeAttention.multi_query", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTBigCodeAttention.kv_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTBigCodeAttention.c_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTBigCodeAttention.c_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTBigCodeAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTBigCodeAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 6, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 11, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.gpt_bigcode", "names": [ "vllm.model_executor.models.gpt_bigcode.GPTBigCodeAttention", "vllm.model_executor.models.gpt_bigcode.GPTBigCodeBlock", "vllm.model_executor.models.gpt_bigcode.GPTBigCodeForCausalLM", "vllm.model_executor.models.gpt_bigcode.GPTBigCodeModel", "vllm.model_executor.models.gpt_bigcode.GPTBigMLP" ], "n_typable": 78, "n_typed": 42, "n_any": 0, "n_untyped": 36, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 32, "n_classes": 5, "n_attrs": 32, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/gpt_j.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.gpt_j.GPTJForCausalLM", "methods": [ { "kind": "function", "name": "GPTJForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GPTJForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPTJForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GPTJForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPTJForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GPTJForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTJForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTJForCausalLM.transformer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTJForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTJForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTJForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 13, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gpt_j.GPTJMLP", "methods": [ { "kind": "function", "name": "GPTJMLP.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GPTJMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GPTJMLP.fc_in", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTJMLP.fc_out", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTJMLP.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 6, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gpt_j.GPTJModel", "methods": [ { "kind": "function", "name": "GPTJModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GPTJModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPTJModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GPTJModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GPTJModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTJModel.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTJModel.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTJModel.wte", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTJModel.ln_f", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTJModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 11, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gpt_j.GPTJBlock", "methods": [ { "kind": "function", "name": "GPTJBlock.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GPTJBlock.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GPTJBlock.ln_1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTJBlock.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTJBlock.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 7, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gpt_j.GPTJAttention", "methods": [ { "kind": "function", "name": "GPTJAttention.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GPTJAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GPTJAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTJAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTJAttention.head_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTJAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTJAttention.out_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTJAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTJAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTJAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 7, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 8, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.gpt_j", "names": [ "vllm.model_executor.models.gpt_j.GPTJAttention", "vllm.model_executor.models.gpt_j.GPTJBlock", "vllm.model_executor.models.gpt_j.GPTJForCausalLM", "vllm.model_executor.models.gpt_j.GPTJMLP", "vllm.model_executor.models.gpt_j.GPTJModel" ], "n_typable": 75, "n_typed": 44, "n_any": 0, "n_untyped": 31, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 34, "n_classes": 5, "n_attrs": 26, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/gpt_neox.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.gpt_neox.GPTNeoXAttention", "methods": [ { "kind": "function", "name": "GPTNeoXAttention.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GPTNeoXAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GPTNeoXAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTNeoXAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTNeoXAttention.head_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTNeoXAttention.bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTNeoXAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTNeoXAttention.query_key_value", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTNeoXAttention.dense", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTNeoXAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTNeoXAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 7, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gpt_neox.GPTNeoXMLP", "methods": [ { "kind": "function", "name": "GPTNeoXMLP.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GPTNeoXMLP.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GPTNeoXMLP.dense_h_to_4h", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTNeoXMLP.dense_4h_to_h", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTNeoXMLP.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 3, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gpt_neox.GPTNeoXModel", "methods": [ { "kind": "function", "name": "GPTNeoXModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GPTNeoXModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPTNeoXModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GPTNeoXModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GPTNeoXModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTNeoXModel.embed_in", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTNeoXModel.final_layer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTNeoXModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 11, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gpt_neox.GPTNeoXLayer", "methods": [ { "kind": "function", "name": "GPTNeoXLayer.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GPTNeoXLayer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GPTNeoXLayer.use_parallel_residual", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTNeoXLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTNeoXLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTNeoXLayer.attention", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTNeoXLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 7, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gpt_neox.GPTNeoXForCausalLM", "methods": [ { "kind": "function", "name": "GPTNeoXForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GPTNeoXForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPTNeoXForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GPTNeoXForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPTNeoXForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GPTNeoXForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTNeoXForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTNeoXForCausalLM.gpt_neox", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTNeoXForCausalLM.embed_out", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTNeoXForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPTNeoXForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 13, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.gpt_neox", "names": [ "vllm.model_executor.models.gpt_neox.GPTNeoXAttention", "vllm.model_executor.models.gpt_neox.GPTNeoXForCausalLM", "vllm.model_executor.models.gpt_neox.GPTNeoXLayer", "vllm.model_executor.models.gpt_neox.GPTNeoXMLP", "vllm.model_executor.models.gpt_neox.GPTNeoXModel" ], "n_typable": 75, "n_typed": 41, "n_any": 0, "n_untyped": 34, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 33, "n_classes": 5, "n_attrs": 27, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/gpt_oss.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.gpt_oss.TransformerBlock", "methods": [ { "kind": "function", "name": "TransformerBlock.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "TransformerBlock.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TransformerBlock.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TransformerBlock.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TransformerBlock.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TransformerBlock.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TransformerBlock.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 7, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gpt_oss.OAIAttention", "methods": [ { "kind": "function", "name": "OAIAttention.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "OAIAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OAIAttention.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OAIAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OAIAttention.num_attention_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OAIAttention.num_key_value_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OAIAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OAIAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OAIAttention.sinks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OAIAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OAIAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OAIAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OAIAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OAIAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OAIAttention.num_local_attention_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OAIAttention.num_local_key_value_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OAIAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 23, "n_typed": 7, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 15, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gpt_oss.MLPBlock", "methods": [ { "kind": "function", "name": "MLPBlock.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MLPBlock.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MLPBlock.is_sequence_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLPBlock.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLPBlock.num_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLPBlock.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLPBlock.experts_per_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLPBlock.world_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLPBlock.router", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLPBlock.experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 5, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gpt_oss.GptOssModel", "methods": [ { "kind": "function", "name": "GptOssModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GptOssModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GptOssModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GptOssModel.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GptOssModel._load_weights_mxfp4", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "GptOssModel._load_weights_quark", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "GptOssModel._load_weights_other", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "GptOssModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GptOssModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GptOssModel.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GptOssModel.parallel_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GptOssModel.embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GptOssModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GptOssModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GptOssModel.aux_hidden_state_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 41, "n_typed": 33, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 26, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gpt_oss.GptOssForCausalLM", "methods": [ { "kind": "function", "name": "GptOssForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GptOssForCausalLM.set_aux_hidden_state_layers", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GptOssForCausalLM.get_eagle3_aux_hidden_state_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GptOssForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GptOssForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GptOssForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GptOssForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GptOssForCausalLM.is_3d_moe_weight", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GptOssForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GptOssForCausalLM.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GptOssForCausalLM.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GptOssForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GptOssForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GptOssForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GptOssForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GptOssForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 25, "n_typed": 17, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 10, "n_attrs": 9, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.gpt_oss", "names": [ "vllm.model_executor.models.gpt_oss.GptOssForCausalLM", "vllm.model_executor.models.gpt_oss.GptOssModel", "vllm.model_executor.models.gpt_oss.MLPBlock", "vllm.model_executor.models.gpt_oss.OAIAttention", "vllm.model_executor.models.gpt_oss.TransformerBlock" ], "n_typable": 116, "n_typed": 69, "n_any": 0, "n_untyped": 47, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 21, "n_method_overloads": 21, "n_method_params": 52, "n_classes": 5, "n_attrs": 44, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/granite.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.granite.GraniteAttention", "methods": [ { "kind": "function", "name": "GraniteAttention.__init__", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "GraniteAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GraniteAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteAttention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 27, "n_typed": 13, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 11, "n_attrs": 14, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.granite.GraniteDecoderLayer", "methods": [ { "kind": "function", "name": "GraniteDecoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GraniteDecoderLayer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GraniteDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteDecoderLayer.residual_multiplier", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 8, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.granite.GraniteMLP", "methods": [ { "kind": "function", "name": "GraniteMLP.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "GraniteMLP.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GraniteMLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.granite.GraniteForCausalLM", "methods": [ { "kind": "function", "name": "GraniteForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GraniteForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GraniteForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GraniteForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GraniteForCausalLM.make_empty_intermediate_tensors", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GraniteForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GraniteForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GraniteForCausalLM.embedding_modules", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GraniteForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 23, "n_typed": 17, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 12, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.granite.GraniteModel", "methods": [ { "kind": "function", "name": "GraniteModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GraniteModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GraniteModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GraniteModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GraniteModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteModel.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 11, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 4, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.granite", "names": [ "vllm.model_executor.models.granite.GraniteAttention", "vllm.model_executor.models.granite.GraniteDecoderLayer", "vllm.model_executor.models.granite.GraniteForCausalLM", "vllm.model_executor.models.granite.GraniteMLP", "vllm.model_executor.models.granite.GraniteModel" ], "n_typable": 92, "n_typed": 56, "n_any": 0, "n_untyped": 36, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 16, "n_method_overloads": 16, "n_method_params": 44, "n_classes": 5, "n_attrs": 34, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/granite_speech.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.granite_speech.GraniteSpeechMultiModalProcessor", "methods": [ { "kind": "function", "name": "GraniteSpeechMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GraniteSpeechMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GraniteSpeechMultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.granite_speech.GraniteSpeechConformerAttention", "methods": [ { "kind": "function", "name": "GraniteSpeechConformerAttention.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GraniteSpeechConformerAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GraniteSpeechConformerAttention.max_pos_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechConformerAttention.context_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechConformerAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechConformerAttention.dim_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechConformerAttention.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechConformerAttention.pre_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechConformerAttention.to_q", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechConformerAttention.to_kv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechConformerAttention.to_out", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechConformerAttention.rel_pos_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 5, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 10, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.granite_speech.ISO639_1_SUPPORTED_LANGS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.granite_speech.GraniteSpeechAudioInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "GraniteSpeechAudioInputs.input_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechAudioInputs.input_features_mask", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechAudioInputs.audio_embed_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.granite_speech.GraniteSpeechEncoderProjector", "methods": [ { "kind": "function", "name": "GraniteSpeechEncoderProjector.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GraniteSpeechEncoderProjector.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GraniteSpeechEncoderProjector.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechEncoderProjector.downsample_rate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechEncoderProjector.window_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechEncoderProjector.num_queries", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechEncoderProjector.query", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechEncoderProjector.qformer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechEncoderProjector.linear", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 6, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.granite_speech.GraniteSpeechMultiModalProcessingInfo", "methods": [ { "kind": "function", "name": "GraniteSpeechMultiModalProcessingInfo.get_data_parser", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GraniteSpeechMultiModalProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GraniteSpeechMultiModalProcessingInfo.get_max_audio_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GraniteSpeechMultiModalProcessingInfo.get_max_audio_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.granite_speech.GraniteSpeechConformerFeedForward", "methods": [ { "kind": "function", "name": "GraniteSpeechConformerFeedForward.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GraniteSpeechConformerFeedForward.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GraniteSpeechConformerFeedForward.pre_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechConformerFeedForward.up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechConformerFeedForward.silu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechConformerFeedForward.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 5, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.granite_speech.GraniteSpeechForConditionalGeneration", "methods": [ { "kind": "function", "name": "GraniteSpeechForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GraniteSpeechForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GraniteSpeechForConditionalGeneration._parse_and_validate_audio_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GraniteSpeechForConditionalGeneration._build_input_features_mask", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GraniteSpeechForConditionalGeneration._pad_and_stack_input_features", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GraniteSpeechForConditionalGeneration._process_audio_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GraniteSpeechForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GraniteSpeechForConditionalGeneration.embed_input_ids", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GraniteSpeechForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "GraniteSpeechForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GraniteSpeechForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GraniteSpeechForConditionalGeneration.get_mm_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GraniteSpeechForConditionalGeneration.get_generation_prompt", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "GraniteSpeechForConditionalGeneration.get_num_audio_tokens", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GraniteSpeechForConditionalGeneration.get_speech_to_text_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GraniteSpeechForConditionalGeneration.supported_languages", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GraniteSpeechForConditionalGeneration.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GraniteSpeechForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechForConditionalGeneration.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechForConditionalGeneration.cache_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechForConditionalGeneration.encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechForConditionalGeneration.projector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 54, "n_typed": 46, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 32, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.granite_speech.GraniteSpeechDummyInputsBuilder", "methods": [ { "kind": "function", "name": "GraniteSpeechDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GraniteSpeechDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.granite_speech.GraniteSpeechConformerBlock", "methods": [ { "kind": "function", "name": "GraniteSpeechConformerBlock.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GraniteSpeechConformerBlock.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GraniteSpeechConformerBlock.ff1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechConformerBlock.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechConformerBlock.conv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechConformerBlock.ff2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechConformerBlock.post_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 5, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.granite_speech.GraniteSpeechConformerConvModule", "methods": [ { "kind": "function", "name": "GraniteSpeechConformerConvModule.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GraniteSpeechConformerConvModule.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GraniteSpeechConformerConvModule.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechConformerConvModule.up_conv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechConformerConvModule.glu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechConformerConvModule.depth_conv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechConformerConvModule.silu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechConformerConvModule.batch_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechConformerConvModule.down_conv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 4, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.granite_speech.GraniteSpeechConformerDepthWiseConv1d", "methods": [ { "kind": "function", "name": "GraniteSpeechConformerDepthWiseConv1d.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GraniteSpeechConformerDepthWiseConv1d.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GraniteSpeechConformerDepthWiseConv1d.padding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechConformerDepthWiseConv1d.conv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 6, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.granite_speech.GraniteSpeechCTCEncoder", "methods": [ { "kind": "function", "name": "GraniteSpeechCTCEncoder.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GraniteSpeechCTCEncoder.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GraniteSpeechCTCEncoder.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechCTCEncoder.attention_dists", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechCTCEncoder.input_linear", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechCTCEncoder.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechCTCEncoder.out", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechCTCEncoder.out_mid", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechCTCEncoder.softmax", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteSpeechCTCEncoder.num_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 4, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 8, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.granite_speech", "names": [ "vllm.model_executor.models.granite_speech.GraniteSpeechAudioInputs", "vllm.model_executor.models.granite_speech.GraniteSpeechCTCEncoder", "vllm.model_executor.models.granite_speech.GraniteSpeechConformerAttention", "vllm.model_executor.models.granite_speech.GraniteSpeechConformerBlock", "vllm.model_executor.models.granite_speech.GraniteSpeechConformerConvModule", "vllm.model_executor.models.granite_speech.GraniteSpeechConformerDepthWiseConv1d", "vllm.model_executor.models.granite_speech.GraniteSpeechConformerFeedForward", "vllm.model_executor.models.granite_speech.GraniteSpeechDummyInputsBuilder", "vllm.model_executor.models.granite_speech.GraniteSpeechEncoderProjector", "vllm.model_executor.models.granite_speech.GraniteSpeechForConditionalGeneration", "vllm.model_executor.models.granite_speech.GraniteSpeechMultiModalProcessingInfo", "vllm.model_executor.models.granite_speech.GraniteSpeechMultiModalProcessor", "vllm.model_executor.models.granite_speech.ISO639_1_SUPPORTED_LANGS" ], "n_typable": 165, "n_typed": 103, "n_any": 0, "n_untyped": 62, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 38, "n_method_overloads": 38, "n_method_params": 74, "n_classes": 12, "n_attrs": 56, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/granitemoe.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.granitemoe.GraniteMoeAttention", "methods": [ { "kind": "function", "name": "GraniteMoeAttention.__init__", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "GraniteMoeAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GraniteMoeAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 26, "n_typed": 13, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 11, "n_attrs": 13, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.granitemoe.GraniteMoeForCausalLM", "methods": [ { "kind": "function", "name": "GraniteMoeForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GraniteMoeForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GraniteMoeForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GraniteMoeForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GraniteMoeForCausalLM.make_empty_intermediate_tensors", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GraniteMoeForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GraniteMoeForCausalLM.fall_back_to_pt_during_load", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GraniteMoeForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GraniteMoeForCausalLM.embedding_modules", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GraniteMoeForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 17, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 12, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.granitemoe.GraniteMoeModel", "methods": [ { "kind": "function", "name": "GraniteMoeModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GraniteMoeModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GraniteMoeModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GraniteMoeModel._load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GraniteMoeModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GraniteMoeModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeModel.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeModel.embedding_multiplier", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 13, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.granitemoe.GraniteMoeMoE", "methods": [ { "kind": "function", "name": "GraniteMoeMoE.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "GraniteMoeMoE.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GraniteMoeMoE.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeMoE.is_sequence_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeMoE.gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeMoE.experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 10, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 10, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.granitemoe.GraniteMoeDecoderLayer", "methods": [ { "kind": "function", "name": "GraniteMoeDecoderLayer.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GraniteMoeDecoderLayer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GraniteMoeDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeDecoderLayer.block_sparse_moe", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeDecoderLayer.residual_multiplier", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 6, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.granitemoe", "names": [ "vllm.model_executor.models.granitemoe.GraniteMoeAttention", "vllm.model_executor.models.granitemoe.GraniteMoeDecoderLayer", "vllm.model_executor.models.granitemoe.GraniteMoeForCausalLM", "vllm.model_executor.models.granitemoe.GraniteMoeMoE", "vllm.model_executor.models.granitemoe.GraniteMoeModel" ], "n_typable": 96, "n_typed": 59, "n_any": 0, "n_untyped": 37, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 17, "n_method_overloads": 17, "n_method_params": 46, "n_classes": 5, "n_attrs": 36, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/granitemoehybrid.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.granitemoehybrid.GraniteMoeHybridForCausalLM", "methods": [ { "kind": "function", "name": "GraniteMoeHybridForCausalLM.get_mamba_state_dtype_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GraniteMoeHybridForCausalLM.get_mamba_state_shape_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GraniteMoeHybridForCausalLM.get_mamba_state_copy_func", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GraniteMoeHybridForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GraniteMoeHybridForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GraniteMoeHybridForCausalLM.forward", "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "GraniteMoeHybridForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GraniteMoeHybridForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GraniteMoeHybridForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GraniteMoeHybridForCausalLM.embedding_modules", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GraniteMoeHybridForCausalLM.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeHybridForCausalLM.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeHybridForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeHybridForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeHybridForCausalLM.scheduler_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeHybridForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeHybridForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeHybridForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeHybridForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 29, "n_typed": 17, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 12, "n_attrs": 11, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.granitemoehybrid.GraniteMoeHybridAttention", "methods": [ { "kind": "function", "name": "GraniteMoeHybridAttention.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "GraniteMoeHybridAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GraniteMoeHybridAttention.causal", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeHybridAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeHybridAttention.attention_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeHybridAttention.attention_multiplier", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeHybridAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeHybridAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeHybridAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeHybridAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeHybridAttention.num_key_value_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeHybridAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeHybridAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeHybridAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeHybridAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 9, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 13, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.granitemoehybrid.GraniteMoeHybridMambaDecoderLayer", "methods": [ { "kind": "function", "name": "GraniteMoeHybridMambaDecoderLayer.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "GraniteMoeHybridMambaDecoderLayer.forward", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GraniteMoeHybridMambaDecoderLayer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeHybridMambaDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeHybridMambaDecoderLayer.residual_multiplier", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeHybridMambaDecoderLayer.mamba", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeHybridMambaDecoderLayer.block_sparse_moe", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeHybridMambaDecoderLayer.shared_mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeHybridMambaDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeHybridMambaDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 9, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 9, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.granitemoehybrid.GraniteMoeHybridModel", "methods": [ { "kind": "function", "name": "GraniteMoeHybridModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GraniteMoeHybridModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GraniteMoeHybridModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GraniteMoeHybridModel.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GraniteMoeHybridModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GraniteMoeHybridModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeHybridModel.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeHybridModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeHybridModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeHybridModel.embedding_multiplier", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeHybridModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeHybridModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 12, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 8, "n_attrs": 7, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.granitemoehybrid.ALL_DECODER_LAYER_TYPES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.granitemoehybrid.GraniteMoeHybridAttentionDecoderLayer", "methods": [ { "kind": "function", "name": "GraniteMoeHybridAttentionDecoderLayer.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "GraniteMoeHybridAttentionDecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GraniteMoeHybridAttentionDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeHybridAttentionDecoderLayer.residual_multiplier", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeHybridAttentionDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeHybridAttentionDecoderLayer.block_sparse_moe", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeHybridAttentionDecoderLayer.shared_mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeHybridAttentionDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeHybridAttentionDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 11, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 9, "n_attrs": 7, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.granitemoehybrid", "names": [ "vllm.model_executor.models.granitemoehybrid.ALL_DECODER_LAYER_TYPES", "vllm.model_executor.models.granitemoehybrid.GraniteMoeHybridAttention", "vllm.model_executor.models.granitemoehybrid.GraniteMoeHybridAttentionDecoderLayer", "vllm.model_executor.models.granitemoehybrid.GraniteMoeHybridForCausalLM", "vllm.model_executor.models.granitemoehybrid.GraniteMoeHybridMambaDecoderLayer", "vllm.model_executor.models.granitemoehybrid.GraniteMoeHybridModel" ], "n_typable": 108, "n_typed": 58, "n_any": 0, "n_untyped": 50, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 19, "n_method_overloads": 19, "n_method_params": 45, "n_classes": 5, "n_attrs": 47, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/granitemoeshared.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.granitemoeshared.GraniteMoeSharedForCausalLM", "methods": [ { "kind": "function", "name": "GraniteMoeSharedForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GraniteMoeSharedForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GraniteMoeSharedForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GraniteMoeSharedForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GraniteMoeSharedForCausalLM.make_empty_intermediate_tensors", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GraniteMoeSharedForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GraniteMoeSharedForCausalLM.fall_back_to_pt_during_load", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GraniteMoeSharedForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GraniteMoeSharedForCausalLM.embedding_modules", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GraniteMoeSharedForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeSharedForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeSharedForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeSharedForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 17, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 12, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.granitemoeshared.GraniteMoeSharedModel", "methods": [ { "kind": "function", "name": "GraniteMoeSharedModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GraniteMoeSharedModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GraniteMoeSharedModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GraniteMoeSharedModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GraniteMoeSharedModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeSharedModel.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeSharedModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeSharedModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeSharedModel.embedding_multiplier", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeSharedModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 11, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.granitemoeshared.GraniteMoeSharedMLP", "methods": [ { "kind": "function", "name": "GraniteMoeSharedMLP.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GraniteMoeSharedMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GraniteMoeSharedMLP.input_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeSharedMLP.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeSharedMLP.input_linear", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeSharedMLP.output_linear", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeSharedMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 5, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.granitemoeshared.GraniteMoeSharedDecoderLayer", "methods": [ { "kind": "function", "name": "GraniteMoeSharedDecoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GraniteMoeSharedDecoderLayer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GraniteMoeSharedDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeSharedDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeSharedDecoderLayer.block_sparse_moe", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeSharedDecoderLayer.shared_mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeSharedDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeSharedDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteMoeSharedDecoderLayer.residual_multiplier", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 8, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 7, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.granitemoeshared", "names": [ "vllm.model_executor.models.granitemoeshared.GraniteMoeSharedDecoderLayer", "vllm.model_executor.models.granitemoeshared.GraniteMoeSharedForCausalLM", "vllm.model_executor.models.granitemoeshared.GraniteMoeSharedMLP", "vllm.model_executor.models.granitemoeshared.GraniteMoeSharedModel" ], "n_typable": 66, "n_typed": 41, "n_any": 0, "n_untyped": 25, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 30, "n_classes": 4, "n_attrs": 25, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/gritlm.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.models.gritlm.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.gritlm.GritLMMeanPool", "methods": [ { "kind": "function", "name": "GritLMMeanPool.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GritLMMeanPool._find_array", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GritLMMeanPool._get_instruction_len", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GritLMMeanPool.get_supported_tasks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GritLMMeanPool.get_pooling_updates", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GritLMMeanPool.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GritLMMeanPool.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GritLMMeanPool.token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GritLMMeanPool.user_pattern_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GritLMMeanPool.embed_newline_pattern_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GritLMMeanPool.embed_pattern_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 14, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 9, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gritlm.GritLMPooler", "methods": [ { "kind": "function", "name": "GritLMPooler.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.gritlm.GritLM", "methods": [ { "kind": "function", "name": "GritLM.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GritLM.is_pooling_model", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GritLM.pooler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 5, "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 3, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.gritlm", "names": [ "vllm.model_executor.models.gritlm.GritLM", "vllm.model_executor.models.gritlm.GritLMMeanPool", "vllm.model_executor.models.gritlm.GritLMPooler", "vllm.model_executor.models.gritlm.logger" ], "n_typable": 28, "n_typed": 18, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 13, "n_classes": 3, "n_attrs": 8, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/grok1.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.models.grok1.DEFAULT_ROUTER_LOGIT_SOFTCAP", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.grok1.Grok1DecoderLayer", "methods": [ { "kind": "function", "name": "Grok1DecoderLayer.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Grok1DecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Grok1DecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Grok1DecoderLayer.use_fp8", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Grok1DecoderLayer.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Grok1DecoderLayer.moe_block", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Grok1DecoderLayer.residual_moe", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Grok1DecoderLayer.residual_moe_scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Grok1DecoderLayer.pre_attn_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Grok1DecoderLayer.post_attn_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Grok1DecoderLayer.pre_moe_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Grok1DecoderLayer.post_moe_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Grok1DecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 8, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 11, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.grok1.Grok1Attention", "methods": [ { "kind": "function", "name": "Grok1Attention.__init__", "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "Grok1Attention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Grok1Attention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Grok1Attention.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Grok1Attention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Grok1Attention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Grok1Attention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Grok1Attention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Grok1Attention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Grok1Attention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Grok1Attention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Grok1Attention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Grok1Attention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Grok1Attention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Grok1Attention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Grok1Attention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Grok1Attention.attn_multiplier", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 28, "n_typed": 12, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 11, "n_attrs": 15, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.grok1.Grok1ForCausalLM", "methods": [ { "kind": "function", "name": "Grok1ForCausalLM.get_weight_name_remapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Grok1ForCausalLM.ckpt_gate_proj_name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Grok1ForCausalLM.ckpt_down_proj_name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Grok1ForCausalLM.ckpt_up_proj_name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.grok1.GrokForCausalLM", "methods": [ { "kind": "function", "name": "GrokForCausalLM.__new__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GrokForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 4, "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.grok1.DEFAULT_OUTPUT_MULTIPLIER_SCALE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.grok1.DEFAULT_EMBEDDING_MULTIPLIER_SCALE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.grok1.Grok2ForCausalLM", "methods": [ { "kind": "function", "name": "Grok2ForCausalLM.get_weight_name_remapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Grok2ForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Grok2ForCausalLM.ckpt_gate_proj_name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Grok2ForCausalLM.ckpt_down_proj_name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Grok2ForCausalLM.ckpt_up_proj_name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.grok1.DEFAULT_ATTN_OUTPUT_MULTIPLIER", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.grok1.Grok1MoE", "methods": [ { "kind": "function", "name": "Grok1MoE.__init__", "n_typed": 10, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "Grok1MoE.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Grok1MoE.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Grok1MoE.gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Grok1MoE.experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Grok1MoE.router_logit_soft_cap", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 12, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 11, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.grok1.Grok1MLP", "methods": [ { "kind": "function", "name": "Grok1MLP.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Grok1MLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Grok1MLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Grok1MLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Grok1MLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 7, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.grok1.GrokBaseForCausalLM", "methods": [ { "kind": "function", "name": "GrokBaseForCausalLM.get_weight_name_remapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GrokBaseForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GrokBaseForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GrokBaseForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GrokBaseForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GrokBaseForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GrokBaseForCausalLM.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GrokBaseForCausalLM.fall_back_to_pt_during_load", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GrokBaseForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GrokBaseForCausalLM.ckpt_gate_proj_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GrokBaseForCausalLM.ckpt_down_proj_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GrokBaseForCausalLM.ckpt_up_proj_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GrokBaseForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GrokBaseForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GrokBaseForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GrokBaseForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GrokBaseForCausalLM.output_multiplier_scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GrokBaseForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GrokBaseForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 26, "n_typed": 18, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 9, "n_attrs": 12, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.grok1.Grok1Model", "methods": [ { "kind": "function", "name": "Grok1Model.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Grok1Model.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Grok1Model.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Grok1Model.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Grok1Model.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Grok1Model.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Grok1Model.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Grok1Model.ckpt_gate_proj_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Grok1Model.ckpt_down_proj_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Grok1Model.ckpt_up_proj_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Grok1Model.weight_name_remapping", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Grok1Model.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Grok1Model.embedding_multiplier_scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Grok1Model.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Grok1Model.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Grok1Model.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 28, "n_typed": 16, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 12, "n_attrs": 11, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.grok1.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.models.grok1", "names": [ "vllm.model_executor.models.grok1.DEFAULT_ATTN_OUTPUT_MULTIPLIER", "vllm.model_executor.models.grok1.DEFAULT_EMBEDDING_MULTIPLIER_SCALE", "vllm.model_executor.models.grok1.DEFAULT_OUTPUT_MULTIPLIER_SCALE", "vllm.model_executor.models.grok1.DEFAULT_ROUTER_LOGIT_SOFTCAP", "vllm.model_executor.models.grok1.Grok1Attention", "vllm.model_executor.models.grok1.Grok1DecoderLayer", "vllm.model_executor.models.grok1.Grok1ForCausalLM", "vllm.model_executor.models.grok1.Grok1MLP", "vllm.model_executor.models.grok1.Grok1MoE", "vllm.model_executor.models.grok1.Grok1Model", "vllm.model_executor.models.grok1.Grok2ForCausalLM", "vllm.model_executor.models.grok1.GrokBaseForCausalLM", "vllm.model_executor.models.grok1.GrokForCausalLM", "vllm.model_executor.models.grok1.logger" ], "n_typable": 136, "n_typed": 77, "n_any": 0, "n_untyped": 59, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 23, "n_method_overloads": 23, "n_method_params": 57, "n_classes": 9, "n_attrs": 69, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/h2ovl.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.models.h2ovl.resolve_h2ovl_min_max_num", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.model_executor.models.h2ovl.H2OVLChatModel", "methods": [ { "kind": "function", "name": "H2OVLChatModel._init_vision_model", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [], "n_typable": 5, "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.h2ovl.calculate_h2ovl_targets", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.model_executor.models.h2ovl.image_to_pixel_values_h2ovl", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "class", "name": "vllm.model_executor.models.h2ovl.H2OVLProcessingInfo", "methods": [ { "kind": "function", "name": "H2OVLProcessingInfo.get_hf_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "H2OVLProcessingInfo.get_num_image_tokens", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.h2ovl.H2OVLProcessor", "methods": [ { "kind": "function", "name": "H2OVLProcessor.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "H2OVLProcessor.get_image_repl", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "H2OVLProcessor.resolve_min_max_num", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "H2OVLProcessor.resolve_target_ratios", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "H2OVLProcessor.get_num_image_tokens", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "H2OVLProcessor._images_to_pixel_values_lst", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [ { "kind": "property", "name": "H2OVLProcessor.image_token_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "H2OVLProcessor.use_msac", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 33, "n_typed": 32, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 25, "n_attrs": 1, "n_properties": 1 }, { "kind": "function", "name": "vllm.model_executor.models.h2ovl.dynamic_preprocess_h2ovl", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.model_executor.models.h2ovl.H2OVLMultiModalProcessor", "methods": [ { "kind": "function", "name": "H2OVLMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "H2OVLMultiModalProcessor._cached_apply_hf_processor", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.h2ovl.get_h2ovl_target_ratios", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [], "name": "vllm.model_executor.models.h2ovl", "names": [ "vllm.model_executor.models.h2ovl.H2OVLChatModel", "vllm.model_executor.models.h2ovl.H2OVLMultiModalProcessor", "vllm.model_executor.models.h2ovl.H2OVLProcessingInfo", "vllm.model_executor.models.h2ovl.H2OVLProcessor", "vllm.model_executor.models.h2ovl.calculate_h2ovl_targets", "vllm.model_executor.models.h2ovl.dynamic_preprocess_h2ovl", "vllm.model_executor.models.h2ovl.get_h2ovl_target_ratios", "vllm.model_executor.models.h2ovl.image_to_pixel_values_h2ovl", "vllm.model_executor.models.h2ovl.resolve_h2ovl_min_max_num" ], "n_typable": 79, "n_typed": 77, "n_any": 0, "n_untyped": 2, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 22, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 39, "n_classes": 4, "n_attrs": 1, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/hunyuan_v1.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.hunyuan_v1.HunYuanCrossAttention", "methods": [ { "kind": "function", "name": "HunYuanCrossAttention.__init__", "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "HunYuanCrossAttention.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "HunYuanCrossAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanCrossAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanCrossAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanCrossAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanCrossAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanCrossAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanCrossAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanCrossAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanCrossAttention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanCrossAttention.use_qk_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanCrossAttention.layer_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanCrossAttention.q_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanCrossAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanCrossAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanCrossAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanCrossAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanCrossAttention.query_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanCrossAttention.key_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 33, "n_typed": 15, "n_any": 0, "n_untyped": 18, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 13, "n_attrs": 18, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.hunyuan_v1.HunYuanDenseV1ForCausalLM", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.hunyuan_v1.HunYuanSparseMoeBlock", "methods": [ { "kind": "function", "name": "HunYuanSparseMoeBlock.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "HunYuanSparseMoeBlock.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "HunYuanSparseMoeBlock.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanSparseMoeBlock.ep_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanSparseMoeBlock.ep_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanSparseMoeBlock.ep_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanSparseMoeBlock.n_routed_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanSparseMoeBlock.enable_eplb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanSparseMoeBlock.n_logical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanSparseMoeBlock.n_redundant_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanSparseMoeBlock.n_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanSparseMoeBlock.n_local_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanSparseMoeBlock.physical_expert_start", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanSparseMoeBlock.physical_expert_end", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanSparseMoeBlock.gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanSparseMoeBlock.experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanSparseMoeBlock.shared_mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 23, "n_typed": 7, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 15, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.hunyuan_v1.HunYuanDecoderLayer", "methods": [ { "kind": "function", "name": "HunYuanDecoderLayer.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "HunYuanDecoderLayer.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "HunYuanDecoderLayer.layer_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanDecoderLayer.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 12, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 10, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.hunyuan_v1.HunYuanModel", "methods": [ { "kind": "function", "name": "HunYuanModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "HunYuanModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HunYuanModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "HunYuanModel._split_qkv_weight", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HunYuanModel.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "HunYuanModel.load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "HunYuanModel.num_redundant_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanModel.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanModel.aux_hidden_state_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 12, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 9, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.hunyuan_v1.HunyuanV1ModelBase", "methods": [ { "kind": "function", "name": "HunyuanV1ModelBase.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "HunyuanV1ModelBase.set_aux_hidden_state_layers", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HunyuanV1ModelBase.get_eagle3_aux_hidden_state_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "HunyuanV1ModelBase.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "HunyuanV1ModelBase.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HunyuanV1ModelBase.make_empty_intermediate_tensors", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "HunyuanV1ModelBase.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HunyuanV1ModelBase.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "HunyuanV1ModelBase.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "HunyuanV1ModelBase.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunyuanV1ModelBase.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunyuanV1ModelBase.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunyuanV1ModelBase.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunyuanV1ModelBase.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 26, "n_typed": 20, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 13, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.hunyuan_v1.HunYuanMoEV1Base", "methods": [ { "kind": "function", "name": "HunYuanMoEV1Base.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "HunYuanMoEV1Base.update_physical_experts_metadata", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "HunYuanMoEV1Base.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "HunYuanMoEV1Base.expert_weights", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanMoEV1Base.num_expert_groups", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanMoEV1Base.moe_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanMoEV1Base.num_moe_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanMoEV1Base.num_logical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanMoEV1Base.num_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanMoEV1Base.num_local_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanMoEV1Base.num_routed_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanMoEV1Base.num_redundant_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 6, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.hunyuan_v1.HunYuanAttention", "methods": [ { "kind": "function", "name": "HunYuanAttention.__init__", "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "HunYuanAttention.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "HunYuanAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanAttention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanAttention.use_qk_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanAttention.layer_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanAttention.query_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanAttention.key_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 33, "n_typed": 15, "n_any": 0, "n_untyped": 18, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 13, "n_attrs": 18, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.hunyuan_v1.HunYuanMLP", "methods": [ { "kind": "function", "name": "HunYuanMLP.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "HunYuanMLP.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "HunYuanMLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 8, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.hunyuan_v1.HunYuanDenseV1Base", "methods": [ { "kind": "function", "name": "HunYuanDenseV1Base.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.hunyuan_v1.HunYuanMoEV1ForCausalLM", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.hunyuan_v1", "names": [ "vllm.model_executor.models.hunyuan_v1.HunYuanAttention", "vllm.model_executor.models.hunyuan_v1.HunYuanCrossAttention", "vllm.model_executor.models.hunyuan_v1.HunYuanDecoderLayer", "vllm.model_executor.models.hunyuan_v1.HunYuanDenseV1Base", "vllm.model_executor.models.hunyuan_v1.HunYuanDenseV1ForCausalLM", "vllm.model_executor.models.hunyuan_v1.HunYuanMLP", "vllm.model_executor.models.hunyuan_v1.HunYuanMoEV1Base", "vllm.model_executor.models.hunyuan_v1.HunYuanMoEV1ForCausalLM", "vllm.model_executor.models.hunyuan_v1.HunYuanModel", "vllm.model_executor.models.hunyuan_v1.HunYuanSparseMoeBlock", "vllm.model_executor.models.hunyuan_v1.HunyuanV1ModelBase" ], "n_typable": 188, "n_typed": 97, "n_any": 0, "n_untyped": 91, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 28, "n_method_overloads": 28, "n_method_params": 78, "n_classes": 11, "n_attrs": 83, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/hunyuan_vision.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.hunyuan_vision.HunYuanVisionAttention", "methods": [ { "kind": "function", "name": "HunYuanVisionAttention.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "HunYuanVisionAttention.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "HunYuanVisionAttention.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVisionAttention.hidden_size_per_attention_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVisionAttention.num_attention_heads_per_partition", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVisionAttention.qkv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVisionAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVisionAttention.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVisionAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 8, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.hunyuan_vision.HunYuanVLImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "HunYuanVLImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLImagePixelInputs.pixel_values", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLImagePixelInputs.image_grid_thw", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.hunyuan_vision.HunYuanVisionPatchEmbed", "methods": [ { "kind": "function", "name": "HunYuanVisionPatchEmbed.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HunYuanVisionPatchEmbed.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "HunYuanVisionPatchEmbed.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVisionPatchEmbed.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVisionPatchEmbed.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVisionPatchEmbed.num_channels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVisionPatchEmbed.spatial_merge_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVisionPatchEmbed.interpolate_mode", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVisionPatchEmbed.patch_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVisionPatchEmbed.max_num_patches", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVisionPatchEmbed.num_positions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVisionPatchEmbed.position_edge", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVisionPatchEmbed.position_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVisionPatchEmbed.patch_pos_embed", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 4, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 12, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.hunyuan_vision.HunYuanVLDummyInputsBuilder", "methods": [ { "kind": "function", "name": "HunYuanVLDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HunYuanVLDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.hunyuan_vision.HunYuanVLImageEmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "HunYuanVLImageEmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLImageEmbeddingInputs.image_embeds", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLImageEmbeddingInputs.image_grid_thw", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.hunyuan_vision.HunYuanVisionBlock", "methods": [ { "kind": "function", "name": "HunYuanVisionBlock.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "HunYuanVisionBlock.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "HunYuanVisionBlock.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVisionBlock.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVisionBlock.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVisionBlock.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 10, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 4, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.hunyuan_vision.HunYuanVLImageInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.hunyuan_vision.HunYuanVLMultiModalProcessor", "methods": [ { "kind": "function", "name": "HunYuanVLMultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "HunYuanVLMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "HunYuanVLMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.hunyuan_vision.HunYuanVisionPatchMerger", "methods": [ { "kind": "function", "name": "HunYuanVisionPatchMerger.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 6, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "HunYuanVisionPatchMerger.forward", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "HunYuanVisionPatchMerger.spatial_merge_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVisionPatchMerger.proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVisionPatchMerger.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVisionPatchMerger.image_newline", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVisionPatchMerger.image_begin", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVisionPatchMerger.image_end", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVisionPatchMerger.image_sep", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVisionPatchMerger.before_rms", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVisionPatchMerger.after_rms", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 0, "n_any": 0, "n_untyped": 18, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.hunyuan_vision.HunYuanVLProcessingInfo", "methods": [ { "kind": "function", "name": "HunYuanVLProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "HunYuanVLProcessingInfo.get_hf_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HunYuanVLProcessingInfo.get_image_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HunYuanVLProcessingInfo.get_data_parser", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "HunYuanVLProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "HunYuanVLProcessingInfo.get_mm_max_tokens_per_item", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "HunYuanVLProcessingInfo._get_vision_info", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "HunYuanVLProcessingInfo.get_num_image_tokens", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "HunYuanVLProcessingInfo.get_image_size_with_most_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "HunYuanVLProcessingInfo.get_max_image_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 24, "n_typed": 22, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 14, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.hunyuan_vision.HunYuanVisionTransformer", "methods": [ { "kind": "function", "name": "HunYuanVisionTransformer.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "HunYuanVisionTransformer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "HunYuanVisionTransformer.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "HunYuanVisionTransformer.dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "HunYuanVisionTransformer.device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "HunYuanVisionTransformer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVisionTransformer.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVisionTransformer.spatial_merge_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVisionTransformer.embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVisionTransformer.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVisionTransformer.perceive", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 11, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_attrs": 6, "n_properties": 2 }, { "kind": "class", "name": "vllm.model_executor.models.hunyuan_vision.HunYuanVLMultiModalDataParser", "methods": [ { "kind": "function", "name": "HunYuanVLMultiModalDataParser._parse_image_data", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.hunyuan_vision.HunYuanVisionMLP", "methods": [ { "kind": "function", "name": "HunYuanVisionMLP.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "HunYuanVisionMLP.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "HunYuanVisionMLP.dense_h_to_4h", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVisionMLP.dense_4h_to_h", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVisionMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.hunyuan_vision.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.hunyuan_vision.HunYuanVLForConditionalGeneration", "methods": [ { "kind": "function", "name": "HunYuanVLForConditionalGeneration.get_xdrope_input_positions", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "HunYuanVLForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "HunYuanVLForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "HunYuanVLForConditionalGeneration._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HunYuanVLForConditionalGeneration._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HunYuanVLForConditionalGeneration._parse_and_validate_multimodal_inputs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HunYuanVLForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HunYuanVLForConditionalGeneration.set_aux_hidden_state_layers", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HunYuanVLForConditionalGeneration.get_eagle3_aux_hidden_state_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "HunYuanVLForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "HunYuanVLForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HunYuanVLForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HunYuanVLForConditionalGeneration.get_mm_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "HunYuanVLForConditionalGeneration.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLForConditionalGeneration.supports_encoder_tp_data", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "HunYuanVLForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLForConditionalGeneration.visual", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 36, "n_typed": 30, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 18, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.hunyuan_vision", "names": [ "vllm.model_executor.models.hunyuan_vision.HunYuanVLDummyInputsBuilder", "vllm.model_executor.models.hunyuan_vision.HunYuanVLForConditionalGeneration", "vllm.model_executor.models.hunyuan_vision.HunYuanVLImageEmbeddingInputs", "vllm.model_executor.models.hunyuan_vision.HunYuanVLImageInputs", "vllm.model_executor.models.hunyuan_vision.HunYuanVLImagePixelInputs", "vllm.model_executor.models.hunyuan_vision.HunYuanVLMultiModalDataParser", "vllm.model_executor.models.hunyuan_vision.HunYuanVLMultiModalProcessor", "vllm.model_executor.models.hunyuan_vision.HunYuanVLProcessingInfo", "vllm.model_executor.models.hunyuan_vision.HunYuanVisionAttention", "vllm.model_executor.models.hunyuan_vision.HunYuanVisionBlock", "vllm.model_executor.models.hunyuan_vision.HunYuanVisionMLP", "vllm.model_executor.models.hunyuan_vision.HunYuanVisionPatchEmbed", "vllm.model_executor.models.hunyuan_vision.HunYuanVisionPatchMerger", "vllm.model_executor.models.hunyuan_vision.HunYuanVisionTransformer", "vllm.model_executor.models.hunyuan_vision.logger" ], "n_typable": 181, "n_typed": 119, "n_any": 0, "n_untyped": 62, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 42, "n_method_overloads": 42, "n_method_params": 83, "n_classes": 13, "n_attrs": 55, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/hyperclovax_vision.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.models.hyperclovax_vision.anyres_postprocessing", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "class", "name": "vllm.model_executor.models.hyperclovax_vision.HCXVisionMultiModalProcessor", "methods": [ { "kind": "function", "name": "HCXVisionMultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "HCXVisionMultiModalProcessor._hf_processor_applies_updates", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "HCXVisionMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "HCXVisionMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 17, "n_typed": 17, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 13, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.hyperclovax_vision.unpad_image", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.models.hyperclovax_vision.get_num_combined_frames", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.models.hyperclovax_vision.select_best_resolution", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.models.hyperclovax_vision.HCXVisionVideoPixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "HCXVisionVideoPixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "HCXVisionVideoPixelInputs.pixel_values_videos", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.hyperclovax_vision.VIDEO_TOKEN", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.hyperclovax_vision.HCXVisionMlp", "methods": [ { "kind": "function", "name": "HCXVisionMlp.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 6, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "HCXVisionMlp.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "HCXVisionMlp.mm_projector_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HCXVisionMlp.fc1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HCXVisionMlp.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HCXVisionMlp.fc2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 0, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 4, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.hyperclovax_vision.reshape_and_unpad_image_features", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "class", "name": "vllm.model_executor.models.hyperclovax_vision.HCXVisionImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "HCXVisionImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "HCXVisionImagePixelInputs.pixel_values_images", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "HCXVisionImagePixelInputs.image_sizes_images", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.hyperclovax_vision.HCXVisionCAbstractor", "methods": [ { "kind": "function", "name": "HCXVisionCAbstractor.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "HCXVisionCAbstractor.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "HCXVisionCAbstractor._forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "HCXVisionCAbstractor._forward_adaptive_num_query", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "HCXVisionCAbstractor.build_net", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "HCXVisionCAbstractor.build_mlp", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "HCXVisionCAbstractor.num_input_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HCXVisionCAbstractor.output_hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HCXVisionCAbstractor.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HCXVisionCAbstractor.pos_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HCXVisionCAbstractor.prenorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 36, "n_typed": 28, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 25, "n_attrs": 5, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.hyperclovax_vision.init_vision_tower_for_hcxvision", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "attr", "name": "vllm.model_executor.models.hyperclovax_vision.IMAGE_TOKEN", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.hyperclovax_vision.HCXVisionDummyInputsBuilder", "methods": [ { "kind": "function", "name": "HCXVisionDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HCXVisionDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.hyperclovax_vision.HCXVisionForCausalLM", "methods": [ { "kind": "function", "name": "HCXVisionForCausalLM.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "HCXVisionForCausalLM.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "HCXVisionForCausalLM._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HCXVisionForCausalLM._parse_and_validate_video_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HCXVisionForCausalLM._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HCXVisionForCausalLM._process_video_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HCXVisionForCausalLM._parse_and_validate_multimodal_inputs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HCXVisionForCausalLM.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HCXVisionForCausalLM.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "HCXVisionForCausalLM.forward_images", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "HCXVisionForCausalLM.forward_videos", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HCXVisionForCausalLM._prepare_multimodal_kwargs", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HCXVisionForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HCXVisionForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HCXVisionForCausalLM._init_possible_resolutions", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "HCXVisionForCausalLM._init_mm_projector", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "HCXVisionForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "HCXVisionForCausalLM.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HCXVisionForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HCXVisionForCausalLM.vision_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HCXVisionForCausalLM.text_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HCXVisionForCausalLM.vision_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HCXVisionForCausalLM.mm_projector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HCXVisionForCausalLM.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HCXVisionForCausalLM.image_newline", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 50, "n_typed": 34, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 16, "n_method_overloads": 16, "n_method_params": 26, "n_attrs": 9, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.hyperclovax_vision.get_anyres_image_grid_shape", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.model_executor.models.hyperclovax_vision.HCXVisionProcessingInfo", "methods": [ { "kind": "function", "name": "HCXVisionProcessingInfo.get_vision_encoder_info", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "HCXVisionProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "HCXVisionProcessingInfo.get_num_image_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HCXVisionProcessingInfo.get_num_video_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HCXVisionProcessingInfo.get_image_size_with_most_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "HCXVisionProcessingInfo.get_max_image_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 8, "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.hyperclovax_vision", "names": [ "vllm.model_executor.models.hyperclovax_vision.HCXVisionCAbstractor", "vllm.model_executor.models.hyperclovax_vision.HCXVisionDummyInputsBuilder", "vllm.model_executor.models.hyperclovax_vision.HCXVisionForCausalLM", "vllm.model_executor.models.hyperclovax_vision.HCXVisionImagePixelInputs", "vllm.model_executor.models.hyperclovax_vision.HCXVisionMlp", "vllm.model_executor.models.hyperclovax_vision.HCXVisionMultiModalProcessor", "vllm.model_executor.models.hyperclovax_vision.HCXVisionProcessingInfo", "vllm.model_executor.models.hyperclovax_vision.HCXVisionVideoPixelInputs", "vllm.model_executor.models.hyperclovax_vision.IMAGE_TOKEN", "vllm.model_executor.models.hyperclovax_vision.VIDEO_TOKEN", "vllm.model_executor.models.hyperclovax_vision.anyres_postprocessing", "vllm.model_executor.models.hyperclovax_vision.get_anyres_image_grid_shape", "vllm.model_executor.models.hyperclovax_vision.get_num_combined_frames", "vllm.model_executor.models.hyperclovax_vision.init_vision_tower_for_hcxvision", "vllm.model_executor.models.hyperclovax_vision.reshape_and_unpad_image_features", "vllm.model_executor.models.hyperclovax_vision.select_best_resolution", "vllm.model_executor.models.hyperclovax_vision.unpad_image" ], "n_typable": 173, "n_typed": 135, "n_any": 0, "n_untyped": 38, "n_functions": 7, "n_function_overloads": 7, "n_function_params": 30, "n_methods": 36, "n_method_overloads": 36, "n_method_params": 76, "n_classes": 8, "n_attrs": 25, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/idefics2_vision_model.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.idefics2_vision_model.Idefics2VisionAttention", "methods": [ { "kind": "function", "name": "Idefics2VisionAttention.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Idefics2VisionAttention.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Idefics2VisionAttention.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics2VisionAttention.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics2VisionAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics2VisionAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics2VisionAttention.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics2VisionAttention.dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics2VisionAttention.num_heads_per_partition", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics2VisionAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics2VisionAttention.out_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics2VisionAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 6, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 10, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.idefics2_vision_model.Idefics2Encoder", "methods": [ { "kind": "function", "name": "Idefics2Encoder.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Idefics2Encoder.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Idefics2Encoder.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics2Encoder.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 7, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.idefics2_vision_model.Idefics2EncoderLayer", "methods": [ { "kind": "function", "name": "Idefics2EncoderLayer.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Idefics2EncoderLayer.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Idefics2EncoderLayer.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics2EncoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics2EncoderLayer.layer_norm1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics2EncoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics2EncoderLayer.layer_norm2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 6, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.idefics2_vision_model.Idefics2VisionMLP", "methods": [ { "kind": "function", "name": "Idefics2VisionMLP.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Idefics2VisionMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Idefics2VisionMLP.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics2VisionMLP.activation_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics2VisionMLP.fc1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics2VisionMLP.fc2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 6, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.idefics2_vision_model.Idefics2VisionEmbeddings", "methods": [ { "kind": "function", "name": "Idefics2VisionEmbeddings.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Idefics2VisionEmbeddings.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Idefics2VisionEmbeddings.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics2VisionEmbeddings.image_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics2VisionEmbeddings.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics2VisionEmbeddings.patch_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics2VisionEmbeddings.num_patches_per_side", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics2VisionEmbeddings.num_patches", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics2VisionEmbeddings.num_positions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics2VisionEmbeddings.position_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 5, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.idefics2_vision_model.Idefics2VisionTransformer", "methods": [ { "kind": "function", "name": "Idefics2VisionTransformer.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Idefics2VisionTransformer.get_input_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Idefics2VisionTransformer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Idefics2VisionTransformer.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Idefics2VisionTransformer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics2VisionTransformer.use_data_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics2VisionTransformer.embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics2VisionTransformer.encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics2VisionTransformer.require_post_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics2VisionTransformer.post_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 11, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 9, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.idefics2_vision_model", "names": [ "vllm.model_executor.models.idefics2_vision_model.Idefics2Encoder", "vllm.model_executor.models.idefics2_vision_model.Idefics2EncoderLayer", "vllm.model_executor.models.idefics2_vision_model.Idefics2VisionAttention", "vllm.model_executor.models.idefics2_vision_model.Idefics2VisionEmbeddings", "vllm.model_executor.models.idefics2_vision_model.Idefics2VisionMLP", "vllm.model_executor.models.idefics2_vision_model.Idefics2VisionTransformer" ], "n_typable": 79, "n_typed": 41, "n_any": 0, "n_untyped": 38, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 30, "n_classes": 6, "n_attrs": 35, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/idefics3.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.idefics3.Idefics3ProcessingInfo", "methods": [ { "kind": "function", "name": "Idefics3ProcessingInfo.get_hf_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Idefics3ProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Idefics3ProcessingInfo._resize_output_size", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Idefics3ProcessingInfo._get_resize_output_image_size", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Idefics3ProcessingInfo._get_image_feature_grid_size", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Idefics3ProcessingInfo.get_num_patches", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Idefics3ProcessingInfo._get_image_token", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Idefics3ProcessingInfo.get_image_repl", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Idefics3ProcessingInfo.get_num_image_tokens", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [], "n_typable": 35, "n_typed": 35, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 26, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.idefics3.Idefics3MultiModalProcessor", "methods": [ { "kind": "function", "name": "Idefics3MultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Idefics3MultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Idefics3MultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.idefics3.Idefics3DummyInputsBuilder", "methods": [ { "kind": "function", "name": "Idefics3DummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Idefics3DummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.idefics3.Idefics3Model", "methods": [ { "kind": "function", "name": "Idefics3Model.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Idefics3Model.image_pixels_to_features", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Idefics3Model.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Idefics3Model.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Idefics3Model.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics3Model.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics3Model.vision_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics3Model.connector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics3Model.text_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics3Model.image_seq_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics3Model.image_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 12, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 9, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.idefics3.Idefics3ImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Idefics3ImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Idefics3ImagePixelInputs.pixel_values", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Idefics3ImagePixelInputs.pixel_attention_mask", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Idefics3ImagePixelInputs.num_patches", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.idefics3.Idefics3SimpleMLP", "methods": [ { "kind": "function", "name": "Idefics3SimpleMLP.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Idefics3SimpleMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Idefics3SimpleMLP.proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.idefics3.Idefics3Connector", "methods": [ { "kind": "function", "name": "Idefics3Connector.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Idefics3Connector.pixel_shuffle", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Idefics3Connector.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Idefics3Connector.scale_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics3Connector.modality_projection", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 8, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.idefics3.Idefics3ImageEmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Idefics3ImageEmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Idefics3ImageEmbeddingInputs.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.idefics3.Idefics3ForConditionalGeneration", "methods": [ { "kind": "function", "name": "Idefics3ForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Idefics3ForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Idefics3ForConditionalGeneration._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Idefics3ForConditionalGeneration._process_image_pixels", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Idefics3ForConditionalGeneration._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Idefics3ForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Idefics3ForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Idefics3ForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Idefics3ForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Idefics3ForConditionalGeneration.get_mm_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Idefics3ForConditionalGeneration.get_num_mm_encoder_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Idefics3ForConditionalGeneration.get_num_mm_connector_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Idefics3ForConditionalGeneration.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Idefics3ForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics3ForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics3ForConditionalGeneration.image_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics3ForConditionalGeneration.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics3ForConditionalGeneration.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Idefics3ForConditionalGeneration.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 35, "n_typed": 28, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 17, "n_attrs": 7, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.idefics3.ImageInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.models.idefics3", "names": [ "vllm.model_executor.models.idefics3.Idefics3Connector", "vllm.model_executor.models.idefics3.Idefics3DummyInputsBuilder", "vllm.model_executor.models.idefics3.Idefics3ForConditionalGeneration", "vllm.model_executor.models.idefics3.Idefics3ImageEmbeddingInputs", "vllm.model_executor.models.idefics3.Idefics3ImagePixelInputs", "vllm.model_executor.models.idefics3.Idefics3Model", "vllm.model_executor.models.idefics3.Idefics3MultiModalProcessor", "vllm.model_executor.models.idefics3.Idefics3ProcessingInfo", "vllm.model_executor.models.idefics3.Idefics3SimpleMLP", "vllm.model_executor.models.idefics3.ImageInputs" ], "n_typable": 133, "n_typed": 113, "n_any": 0, "n_untyped": 20, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 35, "n_method_overloads": 35, "n_method_params": 75, "n_classes": 9, "n_attrs": 24, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/intern_vit.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.intern_vit.InternVisionModel", "methods": [ { "kind": "function", "name": "InternVisionModel.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "InternVisionModel.get_input_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "InternVisionModel.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InternVisionModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "InternVisionModel.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "InternVisionModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternVisionModel.use_data_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternVisionModel.embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternVisionModel.encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 11, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.intern_vit.InternMLP", "methods": [ { "kind": "function", "name": "InternMLP.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "InternMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "InternMLP.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternMLP.activation_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternMLP.fc1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternMLP.fc2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 6, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.intern_vit.InternVisionEncoder", "methods": [ { "kind": "function", "name": "InternVisionEncoder.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "InternVisionEncoder.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "InternVisionEncoder.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternVisionEncoder.layer_cls", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternVisionEncoder.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.intern_vit.InternParallelAttention", "methods": [ { "kind": "function", "name": "InternParallelAttention.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "InternParallelAttention._apply_qk_norm", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InternParallelAttention.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "InternParallelAttention.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternParallelAttention.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternParallelAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternParallelAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternParallelAttention.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternParallelAttention.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternParallelAttention.dummy_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternParallelAttention.num_heads_per_partition", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternParallelAttention.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternParallelAttention.qkv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternParallelAttention.qk_normalization", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternParallelAttention.proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternParallelAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternParallelAttention.q_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternParallelAttention.k_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 25, "n_typed": 9, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 15, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.intern_vit.InternVisionEmbeddings", "methods": [ { "kind": "function", "name": "InternVisionEmbeddings.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InternVisionEmbeddings._get_pos_embed", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "InternVisionEmbeddings._get_position_embedding", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InternVisionEmbeddings.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "InternVisionEmbeddings.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternVisionEmbeddings.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternVisionEmbeddings.image_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternVisionEmbeddings.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternVisionEmbeddings.class_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternVisionEmbeddings.patch_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternVisionEmbeddings.num_patches", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternVisionEmbeddings.num_positions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternVisionEmbeddings.position_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 9, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 7, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.intern_vit.InternVisionPatchModel", "methods": [ { "kind": "function", "name": "InternVisionPatchModel.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InternVisionPatchModel.get_input_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "InternVisionPatchModel.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "InternVisionPatchModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternVisionPatchModel.embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 4, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.intern_vit.NORM2FN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.intern_vit.InternVisionEncoderLayer", "methods": [ { "kind": "function", "name": "InternVisionEncoderLayer.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "InternVisionEncoderLayer._init_attn", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "InternVisionEncoderLayer.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "InternVisionEncoderLayer.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternVisionEncoderLayer.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternVisionEncoderLayer.norm_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternVisionEncoderLayer.attn_cls", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternVisionEncoderLayer.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternVisionEncoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternVisionEncoderLayer.norm1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternVisionEncoderLayer.norm2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternVisionEncoderLayer.ls1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternVisionEncoderLayer.ls2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 23, "n_typed": 11, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 10, "n_attrs": 10, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.intern_vit", "names": [ "vllm.model_executor.models.intern_vit.InternMLP", "vllm.model_executor.models.intern_vit.InternParallelAttention", "vllm.model_executor.models.intern_vit.InternVisionEmbeddings", "vllm.model_executor.models.intern_vit.InternVisionEncoder", "vllm.model_executor.models.intern_vit.InternVisionEncoderLayer", "vllm.model_executor.models.intern_vit.InternVisionModel", "vllm.model_executor.models.intern_vit.InternVisionPatchModel", "vllm.model_executor.models.intern_vit.NORM2FN" ], "n_typable": 114, "n_typed": 57, "n_any": 0, "n_untyped": 57, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 21, "n_method_overloads": 21, "n_method_params": 46, "n_classes": 7, "n_attrs": 49, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/internlm2.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.internlm2.InternLM2Attention", "methods": [ { "kind": "function", "name": "InternLM2Attention.__init__", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "InternLM2Attention.split_qkv", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InternLM2Attention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "InternLM2Attention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternLM2Attention.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternLM2Attention.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternLM2Attention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternLM2Attention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternLM2Attention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternLM2Attention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternLM2Attention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternLM2Attention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternLM2Attention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternLM2Attention.key_value_groups", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternLM2Attention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternLM2Attention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternLM2Attention.wqkv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternLM2Attention.wo", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternLM2Attention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternLM2Attention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 31, "n_typed": 13, "n_any": 0, "n_untyped": 18, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 11, "n_attrs": 17, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.internlm2.InternLM2Model", "methods": [ { "kind": "function", "name": "InternLM2Model.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "InternLM2Model.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InternLM2Model.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "InternLM2Model.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternLM2Model.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternLM2Model.tok_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternLM2Model.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternLM2Model.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 10, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 8, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.internlm2.InternLM2MLP", "methods": [ { "kind": "function", "name": "InternLM2MLP.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "InternLM2MLP.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "InternLM2MLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternLM2MLP.w2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternLM2MLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 6, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.internlm2.InternLMDecoderLayer", "methods": [ { "kind": "function", "name": "InternLMDecoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "InternLMDecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "InternLMDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternLMDecoderLayer.attention", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternLMDecoderLayer.feed_forward", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternLMDecoderLayer.attention_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternLMDecoderLayer.ffn_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 9, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.internlm2.InternLM2ForRewardModel", "methods": [ { "kind": "function", "name": "InternLM2ForRewardModel.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "InternLM2ForRewardModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "InternLM2ForRewardModel.is_pooling_model", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "InternLM2ForRewardModel.head_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternLM2ForRewardModel.v_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternLM2ForRewardModel.pooler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 8, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.internlm2.InternLM2ForCausalLM", "methods": [ { "kind": "function", "name": "InternLM2ForCausalLM.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "InternLM2ForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InternLM2ForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "InternLM2ForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InternLM2ForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "InternLM2ForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "InternLM2ForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternLM2ForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternLM2ForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternLM2ForCausalLM.output", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternLM2ForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternLM2ForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 14, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 10, "n_attrs": 7, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.internlm2", "names": [ "vllm.model_executor.models.internlm2.InternLM2Attention", "vllm.model_executor.models.internlm2.InternLM2ForCausalLM", "vllm.model_executor.models.internlm2.InternLM2ForRewardModel", "vllm.model_executor.models.internlm2.InternLM2MLP", "vllm.model_executor.models.internlm2.InternLM2Model", "vllm.model_executor.models.internlm2.InternLMDecoderLayer" ], "n_typable": 105, "n_typed": 60, "n_any": 0, "n_untyped": 45, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 17, "n_method_overloads": 17, "n_method_params": 49, "n_classes": 6, "n_attrs": 41, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/internlm2_ve.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.internlm2_ve.InternLM2VEForCausalLM", "methods": [ { "kind": "function", "name": "InternLM2VEForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.internlm2_ve.InternLM2VEModel", "methods": [ { "kind": "function", "name": "InternLM2VEModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InternLM2VEModel.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.internlm2_ve.InternLM2VEDecoderLayer", "methods": [ { "kind": "function", "name": "InternLM2VEDecoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "InternLM2VEDecoderLayer.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "InternLM2VEDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternLM2VEDecoderLayer.attention", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternLM2VEDecoderLayer.feed_forward", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternLM2VEDecoderLayer.feed_forward_ve", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternLM2VEDecoderLayer.attention_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternLM2VEDecoderLayer.ffn_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 10, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.internlm2_ve", "names": [ "vllm.model_executor.models.internlm2_ve.InternLM2VEDecoderLayer", "vllm.model_executor.models.internlm2_ve.InternLM2VEForCausalLM", "vllm.model_executor.models.internlm2_ve.InternLM2VEModel" ], "n_typable": 28, "n_typed": 20, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 17, "n_classes": 3, "n_attrs": 6, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/interns1.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.interns1.InternS1ImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "InternS1ImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ImagePixelInputs.pixel_values", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ImagePixelInputs.num_patches", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.interns1.resolve_interns1_min_max_num", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.model_executor.models.interns1.InternS1ForConditionalGeneration", "methods": [ { "kind": "function", "name": "InternS1ForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InternS1ForConditionalGeneration.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InternS1ForConditionalGeneration._init_vision_model", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "InternS1ForConditionalGeneration._init_mlp1", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InternS1ForConditionalGeneration.pixel_shuffle", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InternS1ForConditionalGeneration.extract_feature", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InternS1ForConditionalGeneration._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InternS1ForConditionalGeneration._parse_and_validate_video_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InternS1ForConditionalGeneration._process_vision_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InternS1ForConditionalGeneration._parse_and_validate_multimodal_inputs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InternS1ForConditionalGeneration._set_visual_token_mask", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InternS1ForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InternS1ForConditionalGeneration.embed_input_ids", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "InternS1ForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "InternS1ForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InternS1ForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InternS1ForConditionalGeneration.get_mm_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "InternS1ForConditionalGeneration.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ForConditionalGeneration.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ForConditionalGeneration.num_image_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ForConditionalGeneration.downsample_ratio", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ForConditionalGeneration.img_context_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ForConditionalGeneration.video_context_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ForConditionalGeneration.visual_token_mask", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ForConditionalGeneration.vision_tower", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ForConditionalGeneration.multi_modal_projector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 58, "n_typed": 41, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 17, "n_method_overloads": 17, "n_method_params": 28, "n_attrs": 13, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.interns1.InternS1VideoInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.interns1.InternS1ProcessingInfo", "methods": [ { "kind": "function", "name": "InternS1ProcessingInfo.get_hf_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InternS1ProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "InternS1ProcessingInfo.get_num_image_tokens", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "InternS1ProcessingInfo.resolve_target_ratios", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InternS1ProcessingInfo.get_image_size_with_most_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "InternS1ProcessingInfo.get_max_image_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "InternS1ProcessingInfo.get_num_frames_with_most_features", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 15, "n_typed": 14, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 8, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.interns1.InternS1MultiModalProjector", "methods": [ { "kind": "function", "name": "InternS1MultiModalProjector.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InternS1MultiModalProjector.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "InternS1MultiModalProjector.layer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1MultiModalProjector.linear_1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1MultiModalProjector.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1MultiModalProjector.linear_2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 0, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 4, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.interns1.get_interns1_target_ratios", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.models.interns1.InternS1VideoEmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "InternS1VideoEmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InternS1VideoEmbeddingInputs.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.interns1.InternS1ImageInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.interns1.InternS1MultiModalProcessor", "methods": [ { "kind": "function", "name": "InternS1MultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "InternS1MultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InternS1MultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.interns1.InternS1VideoPixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "InternS1VideoPixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InternS1VideoPixelInputs.pixel_values", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InternS1VideoPixelInputs.num_patches", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.interns1.InternS1ImageEmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "InternS1ImageEmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ImageEmbeddingInputs.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.interns1.InternS1DummyInputsBuilder", "methods": [ { "kind": "function", "name": "InternS1DummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InternS1DummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.interns1", "names": [ "vllm.model_executor.models.interns1.InternS1DummyInputsBuilder", "vllm.model_executor.models.interns1.InternS1ForConditionalGeneration", "vllm.model_executor.models.interns1.InternS1ImageEmbeddingInputs", "vllm.model_executor.models.interns1.InternS1ImageInputs", "vllm.model_executor.models.interns1.InternS1ImagePixelInputs", "vllm.model_executor.models.interns1.InternS1MultiModalProcessor", "vllm.model_executor.models.interns1.InternS1MultiModalProjector", "vllm.model_executor.models.interns1.InternS1ProcessingInfo", "vllm.model_executor.models.interns1.InternS1VideoEmbeddingInputs", "vllm.model_executor.models.interns1.InternS1VideoInputs", "vllm.model_executor.models.interns1.InternS1VideoPixelInputs", "vllm.model_executor.models.interns1.get_interns1_target_ratios", "vllm.model_executor.models.interns1.resolve_interns1_min_max_num" ], "n_typable": 119, "n_typed": 93, "n_any": 0, "n_untyped": 26, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 6, "n_methods": 31, "n_method_overloads": 31, "n_method_params": 51, "n_classes": 9, "n_attrs": 29, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/interns1_pro.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.interns1_pro.InternS1ProMoeSparseMoeBlock", "methods": [ { "kind": "function", "name": "InternS1ProMoeSparseMoeBlock.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InternS1ProMoeSparseMoeBlock.get_group_offsets", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "InternS1ProMoeSparseMoeBlock._custom_routing_function", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "InternS1ProMoeSparseMoeBlock.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "InternS1ProMoeSparseMoeBlock.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeSparseMoeBlock.ep_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeSparseMoeBlock.ep_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeSparseMoeBlock.ep_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeSparseMoeBlock.n_routed_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeSparseMoeBlock.is_sequence_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeSparseMoeBlock.enable_eplb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeSparseMoeBlock.n_logical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeSparseMoeBlock.n_redundant_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeSparseMoeBlock.n_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeSparseMoeBlock.n_local_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeSparseMoeBlock.physical_expert_start", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeSparseMoeBlock.physical_expert_end", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeSparseMoeBlock.n_groups", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeSparseMoeBlock.experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeSparseMoeBlock.gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 30, "n_typed": 12, "n_any": 0, "n_untyped": 18, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 10, "n_attrs": 16, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.interns1_pro.InternS1ProMoeMixtureOfExperts", "methods": [ { "kind": "function", "name": "InternS1ProMoeMixtureOfExperts.update_physical_experts_metadata", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InternS1ProMoeMixtureOfExperts.set_moe_parameters", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.interns1_pro.InternS1ProMoeLLMForCausalLM", "methods": [ { "kind": "function", "name": "InternS1ProMoeLLMForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "InternS1ProMoeLLMForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeLLMForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeLLMForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeLLMForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeLLMForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeLLMForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 2, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.interns1_pro.InternS1ProProcessingInfo", "methods": [ { "kind": "function", "name": "InternS1ProProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "InternS1ProProcessingInfo.get_hf_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.interns1_pro.InternS1ProForConditionalGeneration", "methods": [ { "kind": "function", "name": "InternS1ProForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InternS1ProForConditionalGeneration.get_frope_params_map", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "InternS1ProForConditionalGeneration.load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "InternS1ProForConditionalGeneration.is_3d_moe_weight", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProForConditionalGeneration.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProForConditionalGeneration.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProForConditionalGeneration.use_data_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProForConditionalGeneration.video_pruning_rate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProForConditionalGeneration.is_multimodal_pruning_enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProForConditionalGeneration.use_deepstack", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProForConditionalGeneration.deepstack_num_level", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProForConditionalGeneration.visual_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProForConditionalGeneration.multiscale_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProForConditionalGeneration.visual", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 5, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_attrs": 15, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.interns1_pro.InternS1ProMoeMLP", "methods": [ { "kind": "function", "name": "InternS1ProMoeMLP.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "InternS1ProMoeMLP.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "InternS1ProMoeMLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.interns1_pro.InternS1ProMoeLLMModel", "methods": [ { "kind": "function", "name": "InternS1ProMoeLLMModel.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.interns1_pro.InternS1ProMoeAttention", "methods": [ { "kind": "function", "name": "InternS1ProMoeAttention.__init__", "n_typed": 13, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 }, { "kind": "function", "name": "InternS1ProMoeAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "InternS1ProMoeAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeAttention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeAttention.dual_chunk_attention_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeAttention.q_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeAttention.k_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 33, "n_typed": 16, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 14, "n_attrs": 17, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.interns1_pro.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.interns1_pro.InternS1ProMoeDecoderLayer", "methods": [ { "kind": "function", "name": "InternS1ProMoeDecoderLayer.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InternS1ProMoeDecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "InternS1ProMoeDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1ProMoeDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 5, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.interns1_pro", "names": [ "vllm.model_executor.models.interns1_pro.InternS1ProForConditionalGeneration", "vllm.model_executor.models.interns1_pro.InternS1ProMoeAttention", "vllm.model_executor.models.interns1_pro.InternS1ProMoeDecoderLayer", "vllm.model_executor.models.interns1_pro.InternS1ProMoeLLMForCausalLM", "vllm.model_executor.models.interns1_pro.InternS1ProMoeLLMModel", "vllm.model_executor.models.interns1_pro.InternS1ProMoeMLP", "vllm.model_executor.models.interns1_pro.InternS1ProMoeMixtureOfExperts", "vllm.model_executor.models.interns1_pro.InternS1ProMoeSparseMoeBlock", "vllm.model_executor.models.interns1_pro.InternS1ProProcessingInfo", "vllm.model_executor.models.interns1_pro.logger" ], "n_typable": 129, "n_typed": 57, "n_any": 0, "n_untyped": 72, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 19, "n_method_overloads": 19, "n_method_params": 47, "n_classes": 9, "n_attrs": 63, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/interns1_vit.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.interns1_vit.InternS1VisionEncoder", "methods": [ { "kind": "function", "name": "InternS1VisionEncoder.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "InternS1VisionEncoder.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "InternS1VisionEncoder.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1VisionEncoder.layer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 6, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.interns1_vit.InternSdpaAttention", "methods": [ { "kind": "function", "name": "InternSdpaAttention.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "InternSdpaAttention.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "InternSdpaAttention.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternSdpaAttention.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternSdpaAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternSdpaAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternSdpaAttention.dummy_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternSdpaAttention.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternSdpaAttention.q_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternSdpaAttention.k_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternSdpaAttention.v_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternSdpaAttention.qk_normalization", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternSdpaAttention.projection_layer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternSdpaAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternSdpaAttention.q_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternSdpaAttention.k_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 6, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 14, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.interns1_vit.InternS1VisionLayer", "methods": [ { "kind": "function", "name": "InternS1VisionLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "InternS1VisionLayer._init_attn", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "InternS1VisionLayer.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "InternS1VisionLayer.attention", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1VisionLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1VisionLayer.layernorm_before", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1VisionLayer.layernorm_after", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1VisionLayer.lambda_1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1VisionLayer.lambda_2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 10, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 6, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.interns1_vit.NORM2FN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.interns1_vit.InternS1VisionModel", "methods": [ { "kind": "function", "name": "InternS1VisionModel.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "InternS1VisionModel.get_input_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "InternS1VisionModel.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InternS1VisionModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "InternS1VisionModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1VisionModel.embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1VisionModel.encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1VisionModel.layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 11, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.interns1_vit.InternS1VisionPatchEmbeddings", "methods": [ { "kind": "function", "name": "InternS1VisionPatchEmbeddings.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InternS1VisionPatchEmbeddings.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "InternS1VisionPatchEmbeddings.image_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1VisionPatchEmbeddings.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1VisionPatchEmbeddings.num_channels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1VisionPatchEmbeddings.num_patches", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1VisionPatchEmbeddings.patch_shape", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1VisionPatchEmbeddings.projection", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 2, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.interns1_vit.InternS1VisionMLP", "methods": [ { "kind": "function", "name": "InternS1VisionMLP.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "InternS1VisionMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "InternS1VisionMLP.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1VisionMLP.activation_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1VisionMLP.fc1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1VisionMLP.fc2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 6, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.interns1_vit.InternS1VisionEmbeddings", "methods": [ { "kind": "function", "name": "InternS1VisionEmbeddings.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InternS1VisionEmbeddings.interpolate_pos_encoding", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "InternS1VisionEmbeddings.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "InternS1VisionEmbeddings.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1VisionEmbeddings.cls_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1VisionEmbeddings.patch_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1VisionEmbeddings.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1VisionEmbeddings.image_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1VisionEmbeddings.mask_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternS1VisionEmbeddings.position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 8, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_attrs": 7, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.interns1_vit", "names": [ "vllm.model_executor.models.interns1_vit.InternS1VisionEmbeddings", "vllm.model_executor.models.interns1_vit.InternS1VisionEncoder", "vllm.model_executor.models.interns1_vit.InternS1VisionLayer", "vllm.model_executor.models.interns1_vit.InternS1VisionMLP", "vllm.model_executor.models.interns1_vit.InternS1VisionModel", "vllm.model_executor.models.interns1_vit.InternS1VisionPatchEmbeddings", "vllm.model_executor.models.interns1_vit.InternSdpaAttention", "vllm.model_executor.models.interns1_vit.NORM2FN" ], "n_typable": 100, "n_typed": 49, "n_any": 0, "n_untyped": 51, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 18, "n_method_overloads": 18, "n_method_params": 39, "n_classes": 7, "n_attrs": 44, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/internvl.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.internvl.BaseInternVLProcessingInfo", "methods": [ { "kind": "function", "name": "BaseInternVLProcessingInfo.get_hf_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseInternVLProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BaseInternVLProcessingInfo.get_num_image_tokens", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BaseInternVLProcessingInfo.get_image_size_with_most_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BaseInternVLProcessingInfo.get_max_image_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.internvl.InternVLImageInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.internvl.InternVLProcessingInfo", "methods": [ { "kind": "function", "name": "InternVLProcessingInfo.get_supported_mm_limits", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "InternVLProcessingInfo.get_video_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "InternVLProcessingInfo.get_num_frames_with_most_features", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InternVLProcessingInfo.get_hf_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "InternVLProcessingInfo.supports_video", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [], "n_typable": 8, "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 3, "n_attrs": 0, "n_properties": 1 }, { "kind": "class", "name": "vllm.model_executor.models.internvl.InternVLProcessor", "methods": [ { "kind": "function", "name": "InternVLProcessor.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "InternVLProcessor._videos_to_pixel_values_lst", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InternVLProcessor._preprocess_video", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "InternVLProcessor.__call__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "InternVLProcessor.get_image_repl", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InternVLProcessor.get_video_repl", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [ { "kind": "property", "name": "InternVLProcessor.image_token_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "InternVLProcessor.video_token_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "InternVLProcessor.supports_video", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "InternVLProcessor.video_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 33, "n_typed": 31, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 23, "n_attrs": 1, "n_properties": 3 }, { "kind": "class", "name": "vllm.model_executor.models.internvl.InternVLImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "InternVLImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InternVLImagePixelInputs.pixel_values_flat", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InternVLImagePixelInputs.num_patches", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.internvl.BaseInternVLProcessor", "methods": [ { "kind": "function", "name": "BaseInternVLProcessor.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "BaseInternVLProcessor.get_image_repl", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseInternVLProcessor.resolve_min_max_num", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BaseInternVLProcessor.resolve_target_ratios", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BaseInternVLProcessor.get_num_image_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseInternVLProcessor._images_to_pixel_values_lst", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BaseInternVLProcessor._preprocess_image", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "BaseInternVLProcessor._make_batch_input", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseInternVLProcessor.__call__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [ { "kind": "property", "name": "BaseInternVLProcessor.image_token_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "BaseInternVLProcessor.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseInternVLProcessor.tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseInternVLProcessor.num_image_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseInternVLProcessor.image_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseInternVLProcessor.min_dynamic_patch", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseInternVLProcessor.max_dynamic_patch", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseInternVLProcessor.dynamic_image_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseInternVLProcessor.use_thumbnail", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 51, "n_typed": 43, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 33, "n_attrs": 8, "n_properties": 1 }, { "kind": "function", "name": "vllm.model_executor.models.internvl.calculate_internvl_targets", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "class", "name": "vllm.model_executor.models.internvl.InternVLVideoEmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "InternVLVideoEmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InternVLVideoEmbeddingInputs.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.internvl.InternVLMultiModalProcessor", "methods": [ { "kind": "function", "name": "InternVLMultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "InternVLMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InternVLMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.internvl.video_to_pixel_values_internvl", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.model_executor.models.internvl.build_transform", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.model_executor.models.internvl.BaseInternVLDummyInputsBuilder", "methods": [ { "kind": "function", "name": "BaseInternVLDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseInternVLDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.internvl.IMG_END", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.internvl.IMG_CONTEXT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.internvl.InternVLVideoInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.internvl.InternVLChatModel", "methods": [ { "kind": "function", "name": "InternVLChatModel.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InternVLChatModel.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InternVLChatModel._patch_quant_config", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InternVLChatModel._init_vision_model", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "InternVLChatModel._init_mlp1", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InternVLChatModel.pixel_shuffle", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InternVLChatModel.extract_feature", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InternVLChatModel._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InternVLChatModel._parse_and_validate_video_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InternVLChatModel._process_vision_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InternVLChatModel._parse_and_validate_multimodal_inputs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InternVLChatModel._set_visual_token_mask", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InternVLChatModel.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InternVLChatModel.embed_input_ids", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "InternVLChatModel.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "InternVLChatModel.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InternVLChatModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InternVLChatModel.get_mm_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "InternVLChatModel.get_num_mm_encoder_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InternVLChatModel.get_num_mm_connector_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "InternVLChatModel.supports_encoder_tp_data", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "InternVLChatModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternVLChatModel.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternVLChatModel.use_data_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternVLChatModel.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternVLChatModel.patch_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternVLChatModel.num_image_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternVLChatModel.downsample_ratio", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternVLChatModel.ps_version", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternVLChatModel.is_mono", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternVLChatModel.img_context_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternVLChatModel.video_context_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternVLChatModel.visual_token_mask", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternVLChatModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternVLChatModel.vision_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternVLChatModel.mlp1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InternVLChatModel.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 69, "n_typed": 48, "n_any": 0, "n_untyped": 21, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 20, "n_method_overloads": 20, "n_method_params": 33, "n_attrs": 17, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.internvl.BaseInternVLMultiModalProcessor", "methods": [ { "kind": "function", "name": "BaseInternVLMultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BaseInternVLMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseInternVLMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.internvl.InternVLDummyInputsBuilder", "methods": [ { "kind": "function", "name": "InternVLDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InternVLDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.internvl.get_internvl_target_ratios", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.models.internvl.InternVLImageEmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "InternVLImageEmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InternVLImageEmbeddingInputs.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.internvl.resolve_internvl_min_max_num", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.model_executor.models.internvl.InternVLVideoPixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "InternVLVideoPixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InternVLVideoPixelInputs.pixel_values_flat", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InternVLVideoPixelInputs.num_patches", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.internvl.find_closest_aspect_ratio", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.model_executor.models.internvl.dynamic_preprocess_internvl", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "attr", "name": "vllm.model_executor.models.internvl.IMAGENET_STD", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.internvl.IMAGENET_MEAN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.model_executor.models.internvl.image_to_pixel_values_internvl", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "attr", "name": "vllm.model_executor.models.internvl.IMG_START", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.internvl", "names": [ "vllm.model_executor.models.internvl.BaseInternVLDummyInputsBuilder", "vllm.model_executor.models.internvl.BaseInternVLMultiModalProcessor", "vllm.model_executor.models.internvl.BaseInternVLProcessingInfo", "vllm.model_executor.models.internvl.BaseInternVLProcessor", "vllm.model_executor.models.internvl.IMAGENET_MEAN", "vllm.model_executor.models.internvl.IMAGENET_STD", "vllm.model_executor.models.internvl.IMG_CONTEXT", "vllm.model_executor.models.internvl.IMG_END", "vllm.model_executor.models.internvl.IMG_START", "vllm.model_executor.models.internvl.InternVLChatModel", "vllm.model_executor.models.internvl.InternVLDummyInputsBuilder", "vllm.model_executor.models.internvl.InternVLImageEmbeddingInputs", "vllm.model_executor.models.internvl.InternVLImageInputs", "vllm.model_executor.models.internvl.InternVLImagePixelInputs", "vllm.model_executor.models.internvl.InternVLMultiModalProcessor", "vllm.model_executor.models.internvl.InternVLProcessingInfo", "vllm.model_executor.models.internvl.InternVLProcessor", "vllm.model_executor.models.internvl.InternVLVideoEmbeddingInputs", "vllm.model_executor.models.internvl.InternVLVideoInputs", "vllm.model_executor.models.internvl.InternVLVideoPixelInputs", "vllm.model_executor.models.internvl.build_transform", "vllm.model_executor.models.internvl.calculate_internvl_targets", "vllm.model_executor.models.internvl.dynamic_preprocess_internvl", "vllm.model_executor.models.internvl.find_closest_aspect_ratio", "vllm.model_executor.models.internvl.get_internvl_target_ratios", "vllm.model_executor.models.internvl.image_to_pixel_values_internvl", "vllm.model_executor.models.internvl.resolve_internvl_min_max_num", "vllm.model_executor.models.internvl.video_to_pixel_values_internvl" ], "n_typable": 257, "n_typed": 223, "n_any": 0, "n_untyped": 34, "n_functions": 8, "n_function_overloads": 8, "n_function_params": 31, "n_methods": 54, "n_method_overloads": 54, "n_method_params": 122, "n_classes": 13, "n_attrs": 43, "n_properties": 5, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/iquest_loopcoder.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.iquest_loopcoder.LoopCoderAttention", "methods": [ { "kind": "function", "name": "LoopCoderAttention.__init__", "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "LoopCoderAttention.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LoopCoderAttention.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoopCoderAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoopCoderAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoopCoderAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoopCoderAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoopCoderAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoopCoderAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoopCoderAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoopCoderAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoopCoderAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoopCoderAttention.dual_chunk_attention_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoopCoderAttention.loop_num", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoopCoderAttention.loop_window_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoopCoderAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoopCoderAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoopCoderAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoopCoderAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 34, "n_typed": 17, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 15, "n_attrs": 17, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.iquest_loopcoder.IQuestLoopCoderModel", "methods": [ { "kind": "function", "name": "IQuestLoopCoderModel.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "IQuestLoopCoderModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "IQuestLoopCoderModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "IQuestLoopCoderModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "IQuestLoopCoderModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "IQuestLoopCoderModel.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "IQuestLoopCoderModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "IQuestLoopCoderModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "IQuestLoopCoderModel.loop_num", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "IQuestLoopCoderModel.window_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "IQuestLoopCoderModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 12, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 9, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.iquest_loopcoder.LoopCoderDecoderLayer", "methods": [ { "kind": "function", "name": "LoopCoderDecoderLayer.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "LoopCoderDecoderLayer.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LoopCoderDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoopCoderDecoderLayer.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoopCoderDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoopCoderDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoopCoderDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoopCoderDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 11, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 9, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.iquest_loopcoder.IQuestLoopCoderForCausalLM", "methods": [ { "kind": "function", "name": "IQuestLoopCoderForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "IQuestLoopCoderForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "IQuestLoopCoderForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "IQuestLoopCoderForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "IQuestLoopCoderForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "IQuestLoopCoderForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "IQuestLoopCoderForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "IQuestLoopCoderForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "IQuestLoopCoderForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "IQuestLoopCoderForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 13, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.iquest_loopcoder.LoopGateProjection", "methods": [ { "kind": "function", "name": "LoopGateProjection.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "LoopGateProjection.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LoopGateProjection.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoopGateProjection.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoopGateProjection.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoopGateProjection.gate_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 6, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 4, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.iquest_loopcoder", "names": [ "vllm.model_executor.models.iquest_loopcoder.IQuestLoopCoderForCausalLM", "vllm.model_executor.models.iquest_loopcoder.IQuestLoopCoderModel", "vllm.model_executor.models.iquest_loopcoder.LoopCoderAttention", "vllm.model_executor.models.iquest_loopcoder.LoopCoderDecoderLayer", "vllm.model_executor.models.iquest_loopcoder.LoopGateProjection" ], "n_typable": 101, "n_typed": 59, "n_any": 0, "n_untyped": 42, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 47, "n_classes": 5, "n_attrs": 39, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/isaac.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.isaac.IsaacForConditionalGeneration", "methods": [ { "kind": "function", "name": "IsaacForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "IsaacForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "IsaacForConditionalGeneration.iter_mm_grid_hw", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "IsaacForConditionalGeneration.get_mrope_input_positions", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "IsaacForConditionalGeneration._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "IsaacForConditionalGeneration._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "IsaacForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "IsaacForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "IsaacForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "IsaacForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "IsaacForConditionalGeneration.get_mm_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "IsaacForConditionalGeneration.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "IsaacForConditionalGeneration.supports_encoder_tp_data", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "IsaacForConditionalGeneration.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "IsaacForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "IsaacForConditionalGeneration.vision_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "IsaacForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "IsaacForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "IsaacForConditionalGeneration.vision_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 35, "n_typed": 28, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 18, "n_attrs": 8, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.isaac.create_cumulative_seq_lengths", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.models.isaac.prepare_image_tensor", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.models.isaac.pixel_shuffle_varlen", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.models.isaac.create_pixel_shuffle_index_map", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.model_executor.models.isaac.IsaacProcessor", "methods": [ { "kind": "function", "name": "IsaacProcessor.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "IsaacProcessor.__call__", "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "IsaacProcessor.apply_chat_template", "n_typed": 3, "n_any": 1, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "IsaacProcessor.image_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "IsaacProcessor.image_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "IsaacProcessor.tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 4, "n_any": 1, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 10, "n_attrs": 3, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.isaac.patchify_vision", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.models.isaac.Siglip2Encoder", "methods": [ { "kind": "function", "name": "Siglip2Encoder.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Siglip2Encoder.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Siglip2Encoder.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2Encoder.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 8, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.isaac.Siglip2EncoderLayer", "methods": [ { "kind": "function", "name": "Siglip2EncoderLayer.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Siglip2EncoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Siglip2EncoderLayer.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2EncoderLayer.layer_norm1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2EncoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2EncoderLayer.layer_norm2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2EncoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 8, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.isaac.Siglip2VariableSequenceEmbeddings", "methods": [ { "kind": "function", "name": "Siglip2VariableSequenceEmbeddings.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Siglip2VariableSequenceEmbeddings.positional_embeddings", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Siglip2VariableSequenceEmbeddings.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Siglip2VariableSequenceEmbeddings.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2VariableSequenceEmbeddings.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2VariableSequenceEmbeddings.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2VariableSequenceEmbeddings.patch_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2VariableSequenceEmbeddings.num_patches", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2VariableSequenceEmbeddings.position_embedding_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2VariableSequenceEmbeddings.position_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 4, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.isaac.IsaacDummyInputsBuilder", "methods": [ { "kind": "function", "name": "IsaacDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "IsaacDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.isaac.IsaacImageProcessor", "methods": [ { "kind": "function", "name": "IsaacImageProcessor.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "IsaacImageProcessor.preprocess", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "IsaacImageProcessor.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "IsaacImageProcessor.max_num_patches", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "IsaacImageProcessor.min_num_patches", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "IsaacImageProcessor.pixel_shuffle_scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "IsaacImageProcessor.valid_kwargs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "IsaacImageProcessor.model_input_names", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "IsaacImageProcessor.vision_max_num_patches", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "IsaacImageProcessor.vision_min_num_patches", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 4, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.isaac.Siglip2VisionTransformer", "methods": [ { "kind": "function", "name": "Siglip2VisionTransformer.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Siglip2VisionTransformer.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Siglip2VisionTransformer.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Siglip2VisionTransformer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2VisionTransformer.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2VisionTransformer.embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2VisionTransformer.pixel_shuffle_scale_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2VisionTransformer.encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2VisionTransformer.post_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 7, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 5, "n_attrs": 6, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.isaac.get_image_size_for_max_num_patches", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "attr", "name": "vllm.model_executor.models.isaac.VISION_MEAN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.isaac.IsaacImageProcessorKwargs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "IsaacImageProcessorKwargs.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "IsaacImageProcessorKwargs.max_num_patches", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "IsaacImageProcessorKwargs.min_num_patches", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "IsaacImageProcessorKwargs.pixel_shuffle_scale", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.isaac.IsaacMultiModalProcessor", "methods": [ { "kind": "function", "name": "IsaacMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "IsaacMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.isaac.IsaacProcessingInfo", "methods": [ { "kind": "function", "name": "IsaacProcessingInfo.get_hf_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "IsaacProcessingInfo.get_hf_processor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "IsaacProcessingInfo.get_tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "IsaacProcessingInfo.get_image_size_with_most_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "IsaacProcessingInfo.get_image_processor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "IsaacProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "IsaacProcessingInfo.get_mm_max_tokens_per_item", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 11, "n_typed": 8, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.isaac.VISION_SCALE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.isaac.IsaacVisionEmbedding", "methods": [ { "kind": "function", "name": "IsaacVisionEmbedding.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "IsaacVisionEmbedding.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "IsaacVisionEmbedding.transformer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "IsaacVisionEmbedding.linear_fc1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "IsaacVisionEmbedding.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "IsaacVisionEmbedding.linear_fc2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 4, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.isaac.VISION_STD", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.isaac.MAX_PIXELS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.model_executor.models.isaac.extract_image_pil", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.models.isaac.process_vision_for_patches", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "class", "name": "vllm.model_executor.models.isaac.Siglip2VisionAttention", "methods": [ { "kind": "function", "name": "Siglip2VisionAttention.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Siglip2VisionAttention.split_qkv", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Siglip2VisionAttention.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Siglip2VisionAttention.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2VisionAttention.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2VisionAttention.hidden_size_per_attention_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2VisionAttention.num_attention_heads_per_partition", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2VisionAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2VisionAttention.out_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2VisionAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 10, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.isaac.IsaacImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "IsaacImagePixelInputs.pixel_values", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "IsaacImagePixelInputs.image_grid_thw", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.isaac", "names": [ "vllm.model_executor.models.isaac.IsaacDummyInputsBuilder", "vllm.model_executor.models.isaac.IsaacForConditionalGeneration", "vllm.model_executor.models.isaac.IsaacImagePixelInputs", "vllm.model_executor.models.isaac.IsaacImageProcessor", "vllm.model_executor.models.isaac.IsaacImageProcessorKwargs", "vllm.model_executor.models.isaac.IsaacMultiModalProcessor", "vllm.model_executor.models.isaac.IsaacProcessingInfo", "vllm.model_executor.models.isaac.IsaacProcessor", "vllm.model_executor.models.isaac.IsaacVisionEmbedding", "vllm.model_executor.models.isaac.MAX_PIXELS", "vllm.model_executor.models.isaac.Siglip2Encoder", "vllm.model_executor.models.isaac.Siglip2EncoderLayer", "vllm.model_executor.models.isaac.Siglip2VariableSequenceEmbeddings", "vllm.model_executor.models.isaac.Siglip2VisionAttention", "vllm.model_executor.models.isaac.Siglip2VisionTransformer", "vllm.model_executor.models.isaac.VISION_MEAN", "vllm.model_executor.models.isaac.VISION_SCALE", "vllm.model_executor.models.isaac.VISION_STD", "vllm.model_executor.models.isaac.create_cumulative_seq_lengths", "vllm.model_executor.models.isaac.create_pixel_shuffle_index_map", "vllm.model_executor.models.isaac.extract_image_pil", "vllm.model_executor.models.isaac.get_image_size_for_max_num_patches", "vllm.model_executor.models.isaac.patchify_vision", "vllm.model_executor.models.isaac.pixel_shuffle_varlen", "vllm.model_executor.models.isaac.prepare_image_tensor", "vllm.model_executor.models.isaac.process_vision_for_patches" ], "n_typable": 200, "n_typed": 137, "n_any": 1, "n_untyped": 62, "n_functions": 8, "n_function_overloads": 8, "n_function_params": 26, "n_methods": 42, "n_method_overloads": 42, "n_method_params": 78, "n_classes": 14, "n_attrs": 60, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/jais.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.jais.JAISBlock", "methods": [ { "kind": "function", "name": "JAISBlock.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "JAISBlock.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "JAISBlock.ln_1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISBlock.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISBlock.ln_2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISBlock.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 6, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.jais.JAISLMHeadModel", "methods": [ { "kind": "function", "name": "JAISLMHeadModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "JAISLMHeadModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "JAISLMHeadModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "JAISLMHeadModel.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "JAISLMHeadModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "JAISLMHeadModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISLMHeadModel.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISLMHeadModel.transformer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISLMHeadModel.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISLMHeadModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISLMHeadModel.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISLMHeadModel.output_logits_scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 13, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.jais.JAISModel", "methods": [ { "kind": "function", "name": "JAISModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "JAISModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "JAISModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "JAISModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISModel.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISModel.wte", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISModel.wpe", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISModel.ln_f", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISModel.embeddings_scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 9, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.jais.SwiGLUActivation", "methods": [ { "kind": "function", "name": "SwiGLUActivation.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.jais.JAISMLP", "methods": [ { "kind": "function", "name": "JAISMLP.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "JAISMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "JAISMLP.swiglu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISMLP.c_fc", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISMLP.c_fc2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISMLP.c_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISMLP.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 6, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.jais.JAISAttention", "methods": [ { "kind": "function", "name": "JAISAttention.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "JAISAttention.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "JAISAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISAttention.attn_scale_power", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISAttention.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISAttention.c_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISAttention.c_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 6, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 8, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.jais", "names": [ "vllm.model_executor.models.jais.JAISAttention", "vllm.model_executor.models.jais.JAISBlock", "vllm.model_executor.models.jais.JAISLMHeadModel", "vllm.model_executor.models.jais.JAISMLP", "vllm.model_executor.models.jais.JAISModel", "vllm.model_executor.models.jais.SwiGLUActivation" ], "n_typable": 79, "n_typed": 43, "n_any": 0, "n_untyped": 36, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 33, "n_classes": 6, "n_attrs": 31, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/jais2.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.jais2.Jais2DecoderLayer", "methods": [ { "kind": "function", "name": "Jais2DecoderLayer.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Jais2DecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Jais2DecoderLayer.get_quant_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Jais2DecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Jais2DecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Jais2DecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Jais2DecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Jais2DecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 10, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.jais2.Jais2MLP", "methods": [ { "kind": "function", "name": "Jais2MLP.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Jais2MLP.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Jais2MLP.up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Jais2MLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Jais2MLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.jais2.Jais2ForCausalLM", "methods": [ { "kind": "function", "name": "Jais2ForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Jais2ForCausalLM._init_model", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Jais2ForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Jais2ForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Jais2ForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Jais2ForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Jais2ForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Jais2ForCausalLM.embedding_modules", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Jais2ForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Jais2ForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Jais2ForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Jais2ForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Jais2ForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 15, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 11, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.jais2.Jais2Model", "methods": [ { "kind": "function", "name": "Jais2Model.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Jais2Model.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Jais2Model.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Jais2Model.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Jais2Model.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Jais2Model.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Jais2Model.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Jais2Model.org_vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Jais2Model.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Jais2Model.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Jais2Model.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 12, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 9, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.jais2.Jais2Attention", "methods": [ { "kind": "function", "name": "Jais2Attention.__init__", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "Jais2Attention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Jais2Attention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Jais2Attention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Jais2Attention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Jais2Attention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Jais2Attention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Jais2Attention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Jais2Attention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Jais2Attention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Jais2Attention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Jais2Attention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Jais2Attention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Jais2Attention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Jais2Attention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Jais2Attention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 27, "n_typed": 13, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 11, "n_attrs": 14, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.jais2", "names": [ "vllm.model_executor.models.jais2.Jais2Attention", "vllm.model_executor.models.jais2.Jais2DecoderLayer", "vllm.model_executor.models.jais2.Jais2ForCausalLM", "vllm.model_executor.models.jais2.Jais2MLP", "vllm.model_executor.models.jais2.Jais2Model" ], "n_typable": 96, "n_typed": 57, "n_any": 0, "n_untyped": 39, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 17, "n_method_overloads": 17, "n_method_params": 45, "n_classes": 5, "n_attrs": 36, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/jamba.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.jamba.JambaMambaDecoderLayer", "methods": [ { "kind": "function", "name": "JambaMambaDecoderLayer.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "JambaMambaDecoderLayer.forward", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "JambaMambaDecoderLayer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JambaMambaDecoderLayer.is_lora_enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JambaMambaDecoderLayer.mamba", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JambaMambaDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JambaMambaDecoderLayer.pre_ff_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JambaMambaDecoderLayer.feed_forward", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 10, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 11, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.jamba.JambaForCausalLM", "methods": [ { "kind": "function", "name": "JambaForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "JambaForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "JambaForCausalLM.forward", "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "JambaForCausalLM.copy_inputs_before_cuda_graphs", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "JambaForCausalLM.get_seqlen_agnostic_capture_inputs", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "JambaForCausalLM.get_mamba_state_dtype_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "JambaForCausalLM.get_mamba_state_shape_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "JambaForCausalLM.get_mamba_state_copy_func", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "JambaForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "JambaForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "JambaForCausalLM.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "JambaForCausalLM.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JambaForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "JambaForCausalLM.embedding_modules", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "JambaForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JambaForCausalLM.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JambaForCausalLM.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JambaForCausalLM.scheduler_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JambaForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JambaForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JambaForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JambaForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 35, "n_typed": 19, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 15, "n_attrs": 11, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.jamba.JambaAttentionDecoderLayer", "methods": [ { "kind": "function", "name": "JambaAttentionDecoderLayer.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "JambaAttentionDecoderLayer.self_attention", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "JambaAttentionDecoderLayer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "JambaAttentionDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JambaAttentionDecoderLayer.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JambaAttentionDecoderLayer.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JambaAttentionDecoderLayer.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JambaAttentionDecoderLayer.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JambaAttentionDecoderLayer.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JambaAttentionDecoderLayer.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JambaAttentionDecoderLayer.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JambaAttentionDecoderLayer.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JambaAttentionDecoderLayer.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JambaAttentionDecoderLayer.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JambaAttentionDecoderLayer.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JambaAttentionDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JambaAttentionDecoderLayer.pre_ff_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JambaAttentionDecoderLayer.feed_forward", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 32, "n_typed": 13, "n_any": 0, "n_untyped": 19, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 14, "n_attrs": 15, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.jamba.JambaMoE", "methods": [ { "kind": "function", "name": "JambaMoE.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "JambaMoE.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "JambaMoE.num_total_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JambaMoE.top_k", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JambaMoE.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JambaMoE.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JambaMoE.experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JambaMoE.router", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 9, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.jamba.JambaModel", "methods": [ { "kind": "function", "name": "JambaModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "JambaModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "JambaModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "JambaModel.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "JambaModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "JambaModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JambaModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JambaModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JambaModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JambaModel.final_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 12, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 8, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.jamba.JambaForSequenceClassification", "methods": [ { "kind": "function", "name": "JambaForSequenceClassification.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "JambaForSequenceClassification.is_pooling_model", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "JambaForSequenceClassification.score", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JambaForSequenceClassification.pooler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 5, "n_typed": 2, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.jamba.ALL_DECODER_LAYER_TYPES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.jamba", "names": [ "vllm.model_executor.models.jamba.ALL_DECODER_LAYER_TYPES", "vllm.model_executor.models.jamba.JambaAttentionDecoderLayer", "vllm.model_executor.models.jamba.JambaForCausalLM", "vllm.model_executor.models.jamba.JambaForSequenceClassification", "vllm.model_executor.models.jamba.JambaMambaDecoderLayer", "vllm.model_executor.models.jamba.JambaMoE", "vllm.model_executor.models.jamba.JambaModel" ], "n_typable": 125, "n_typed": 65, "n_any": 0, "n_untyped": 60, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 24, "n_method_overloads": 24, "n_method_params": 58, "n_classes": 6, "n_attrs": 47, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/jina_vl.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.jina_vl.JinaVLForSequenceClassification", "methods": [ { "kind": "function", "name": "JinaVLForSequenceClassification.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "JinaVLForSequenceClassification.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "JinaVLForSequenceClassification.get_score_template", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "JinaVLForSequenceClassification.post_process_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "JinaVLForSequenceClassification.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "JinaVLForSequenceClassification.load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "JinaVLForSequenceClassification.is_pooling_model", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "JinaVLForSequenceClassification.weight_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JinaVLForSequenceClassification.score", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JinaVLForSequenceClassification.pooler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 17, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 13, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.jina_vl.JinaVLMultiModalProcessor", "methods": [ { "kind": "function", "name": "JinaVLMultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.jina_vl.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.jina_vl.JinaVLScorer", "methods": [ { "kind": "function", "name": "JinaVLScorer.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "JinaVLScorer.forward", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "JinaVLScorer.dense", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JinaVLScorer.out_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 2, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.jina_vl", "names": [ "vllm.model_executor.models.jina_vl.JinaVLForSequenceClassification", "vllm.model_executor.models.jina_vl.JinaVLMultiModalProcessor", "vllm.model_executor.models.jina_vl.JinaVLScorer", "vllm.model_executor.models.jina_vl.logger" ], "n_typable": 36, "n_typed": 24, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 21, "n_classes": 3, "n_attrs": 7, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/kanana_v.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.kanana_v.KananaVMultiModalProcessor", "methods": [ { "kind": "function", "name": "KananaVMultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "KananaVMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "KananaVMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [ { "kind": "property", "name": "KananaVMultiModalProcessor.media_token_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [], "n_typable": 13, "n_typed": 13, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 0, "n_properties": 1 }, { "kind": "function", "name": "vllm.model_executor.models.kanana_v.build_mlp", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.model_executor.models.kanana_v.KananaVProcessingInfo", "methods": [ { "kind": "function", "name": "KananaVProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KananaVProcessingInfo.get_image_size_with_most_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KananaVProcessingInfo._get_vision_info", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "KananaVProcessingInfo.get_mm_max_tokens_per_item", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 10, "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 6, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.kanana_v.KananaVDummyInputsBuilder", "methods": [ { "kind": "function", "name": "KananaVDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KananaVDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.kanana_v.KananaVForConditionalGeneration", "methods": [ { "kind": "function", "name": "KananaVForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "KananaVForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "KananaVForConditionalGeneration._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KananaVForConditionalGeneration._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KananaVForConditionalGeneration._get_visual_feature_at", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "KananaVForConditionalGeneration.forward_vision", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "KananaVForConditionalGeneration.forward_projector", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "KananaVForConditionalGeneration.forward_and_project_vision", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "KananaVForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KananaVForConditionalGeneration.forward", "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "KananaVForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KananaVForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "KananaVForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KananaVForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KananaVForConditionalGeneration.vision_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KananaVForConditionalGeneration.abstractor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KananaVForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 39, "n_typed": 31, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 22, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.kanana_v.KananaVImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "KananaVImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KananaVImagePixelInputs.pixel_values", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KananaVImagePixelInputs.vision_grid_thw", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.kanana_v.PatchMerge", "methods": [ { "kind": "function", "name": "PatchMerge.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PatchMerge.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PatchMerge.merge_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 6, "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.kanana_v.build_pos_embeds", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.model_executor.models.kanana_v.DynamicCAbstractor", "methods": [ { "kind": "function", "name": "DynamicCAbstractor.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DynamicCAbstractor._load_from_state_dict", "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DynamicCAbstractor.build_net", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DynamicCAbstractor.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DynamicCAbstractor._forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DynamicCAbstractor.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DynamicCAbstractor.merge_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DynamicCAbstractor.pos_emb_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DynamicCAbstractor.num_input_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DynamicCAbstractor.pos_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 12, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 10, "n_attrs": 5, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.kanana_v.KananaVImageInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.models.kanana_v.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.kanana_v.CustomQwen2VLVE", "methods": [ { "kind": "function", "name": "CustomQwen2VLVE.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CustomQwen2VLVE._from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CustomQwen2VLVE.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "CustomQwen2VLVE.get_num_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 10, "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 6, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.kanana_v", "names": [ "vllm.model_executor.models.kanana_v.CustomQwen2VLVE", "vllm.model_executor.models.kanana_v.DynamicCAbstractor", "vllm.model_executor.models.kanana_v.KananaVDummyInputsBuilder", "vllm.model_executor.models.kanana_v.KananaVForConditionalGeneration", "vllm.model_executor.models.kanana_v.KananaVImageInputs", "vllm.model_executor.models.kanana_v.KananaVImagePixelInputs", "vllm.model_executor.models.kanana_v.KananaVMultiModalProcessor", "vllm.model_executor.models.kanana_v.KananaVProcessingInfo", "vllm.model_executor.models.kanana_v.PatchMerge", "vllm.model_executor.models.kanana_v.build_mlp", "vllm.model_executor.models.kanana_v.build_pos_embeds", "vllm.model_executor.models.kanana_v.logger" ], "n_typable": 117, "n_typed": 99, "n_any": 0, "n_untyped": 18, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 6, "n_methods": 32, "n_method_overloads": 32, "n_method_params": 60, "n_classes": 8, "n_attrs": 16, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/keye.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.keye.KeyeVideoEmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "KeyeVideoEmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KeyeVideoEmbeddingInputs.video_embeds", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KeyeVideoEmbeddingInputs.video_grid_thw", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.keye.smart_resize", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "class", "name": "vllm.model_executor.models.keye.KeyeVisionEmbeddings", "methods": [ { "kind": "function", "name": "KeyeVisionEmbeddings.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KeyeVisionEmbeddings.interpolate_pos_encoding", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "KeyeVisionEmbeddings.fetch_position_embedding_lfu_cache", "n_typed": 1, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "KeyeVisionEmbeddings.forward", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "KeyeVisionEmbeddings.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KeyeVisionEmbeddings.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KeyeVisionEmbeddings.image_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KeyeVisionEmbeddings.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KeyeVisionEmbeddings.patch_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KeyeVisionEmbeddings.num_patches", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KeyeVisionEmbeddings.num_positions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KeyeVisionEmbeddings.cache_position_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KeyeVisionEmbeddings.cache_position_count", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KeyeVisionEmbeddings.position_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KeyeVisionEmbeddings.packing_position_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 28, "n_typed": 11, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 13, "n_attrs": 11, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.keye.KeyeForConditionalGeneration", "methods": [ { "kind": "function", "name": "KeyeForConditionalGeneration._build_projector", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "KeyeForConditionalGeneration._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KeyeForConditionalGeneration._parse_and_validate_video_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KeyeForConditionalGeneration._process_video_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KeyeForConditionalGeneration.get_mrope_input_positions", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 14, "n_typed": 14, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.keye.BaseKeyeModule", "methods": [ { "kind": "function", "name": "BaseKeyeModule.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseKeyeModule.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseKeyeModule._build_projector", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BaseKeyeModule._process_image_input", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseKeyeModule._process_video_embeds", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BaseKeyeModule._parse_and_validate_multimodal_inputs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseKeyeModule.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseKeyeModule.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "BaseKeyeModule.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseKeyeModule.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseKeyeModule.get_mm_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BaseKeyeModule.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BaseKeyeModule.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseKeyeModule.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseKeyeModule.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseKeyeModule.visual", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseKeyeModule.mlp_AR", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseKeyeModule.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 38, "n_typed": 30, "n_any": 1, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 21, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.keye.KeyeImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "KeyeImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KeyeImagePixelInputs.pixel_values", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KeyeImagePixelInputs.image_grid_thw", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.keye.Projector", "methods": [ { "kind": "function", "name": "Projector.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Projector.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Projector.text_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Projector.vision_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Projector.merge_kernel_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Projector.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Projector.pre_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Projector.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Projector.linear_1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Projector.linear_2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 7, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.keye.KeyeSiglipEncoder", "methods": [ { "kind": "function", "name": "KeyeSiglipEncoder.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "KeyeSiglipEncoder.flatten_list", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KeyeSiglipEncoder.forward", "n_typed": 11, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "KeyeSiglipEncoder.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KeyeSiglipEncoder.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KeyeSiglipEncoder.rotary_pos_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 14, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 15, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.keye.KeyeSiglipAttention", "methods": [ { "kind": "function", "name": "KeyeSiglipAttention.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "KeyeSiglipAttention.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "KeyeSiglipAttention.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KeyeSiglipAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KeyeSiglipAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KeyeSiglipAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KeyeSiglipAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KeyeSiglipAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KeyeSiglipAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KeyeSiglipAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KeyeSiglipAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KeyeSiglipAttention.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KeyeSiglipAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KeyeSiglipAttention.out_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KeyeSiglipAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KeyeSiglipAttention.apply_rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 24, "n_typed": 9, "n_any": 0, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 14, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.keye.KeyeMultiModalProcessor", "methods": [ { "kind": "function", "name": "KeyeMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "KeyeMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.keye.KeyeVideoInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.keye.SigLIPRotaryEmbedding", "methods": [ { "kind": "function", "name": "SigLIPRotaryEmbedding.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SigLIPRotaryEmbedding.rope_init", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SigLIPRotaryEmbedding.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SigLIPRotaryEmbedding.dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SigLIPRotaryEmbedding.theta", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 5, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.keye.KeyeProcessingInfo", "methods": [ { "kind": "function", "name": "KeyeProcessingInfo.get_max_image_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KeyeProcessingInfo.get_max_frame_per_video", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KeyeProcessingInfo.get_image_processor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KeyeProcessingInfo.get_data_parser", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KeyeProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KeyeProcessingInfo.get_mm_max_tokens_per_item", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "KeyeProcessingInfo._get_vision_info", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "KeyeProcessingInfo.get_num_image_tokens", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "KeyeProcessingInfo.get_num_video_tokens", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "KeyeProcessingInfo.get_image_size_with_most_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KeyeProcessingInfo.get_max_image_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KeyeProcessingInfo._get_max_video_frames", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KeyeProcessingInfo.get_num_frames_with_most_features", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KeyeProcessingInfo.get_max_video_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 35, "n_typed": 33, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 21, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.keye.apply_rotary_pos_emb_flashatt", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "class", "name": "vllm.model_executor.models.keye.KeyeBaseDummyInputsBuilder", "methods": [ { "kind": "function", "name": "KeyeBaseDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KeyeBaseDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.keye.KeyeDummyInputsBuilder", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.keye.KeyeSiglipVisionTransformer", "methods": [ { "kind": "function", "name": "KeyeSiglipVisionTransformer.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "KeyeSiglipVisionTransformer.forward", "n_typed": 17, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 18, "n_params": 17, "n_function_overloads": 1, "n_function_params": 17 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "KeyeSiglipVisionTransformer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KeyeSiglipVisionTransformer.embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KeyeSiglipVisionTransformer.encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KeyeSiglipVisionTransformer.post_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 26, "n_typed": 20, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 20, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.keye.KeyeSiglipEncoderLayer", "methods": [ { "kind": "function", "name": "KeyeSiglipEncoderLayer.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "KeyeSiglipEncoderLayer.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "KeyeSiglipEncoderLayer.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KeyeSiglipEncoderLayer.layer_norm1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KeyeSiglipEncoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KeyeSiglipEncoderLayer.layer_norm2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KeyeSiglipEncoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 9, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.keye.KeyeSiglipVisionModel", "methods": [ { "kind": "function", "name": "KeyeSiglipVisionModel.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "KeyeSiglipVisionModel.get_input_embeddings", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KeyeSiglipVisionModel.forward", "n_typed": 12, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 }, { "kind": "function", "name": "KeyeSiglipVisionModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "KeyeSiglipVisionModel.dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "KeyeSiglipVisionModel.device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "KeyeSiglipVisionModel.config_class", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "KeyeSiglipVisionModel.main_input_name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "KeyeSiglipVisionModel.vision_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KeyeSiglipVisionModel.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 24, "n_typed": 20, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 16, "n_attrs": 4, "n_properties": 2 }, { "kind": "class", "name": "vllm.model_executor.models.keye.KeyeImageEmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "KeyeImageEmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KeyeImageEmbeddingInputs.image_embeds", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KeyeImageEmbeddingInputs.image_grid_thw", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.keye.KeyeVideoPixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "KeyeVideoPixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KeyeVideoPixelInputs.pixel_values_videos", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KeyeVideoPixelInputs.video_grid_thw", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.keye.KeyeImageInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.models.keye.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.keye.KeyeMultiModalDataParser", "methods": [ { "kind": "function", "name": "KeyeMultiModalDataParser._parse_image_data", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KeyeMultiModalDataParser._parse_video_data", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.keye", "names": [ "vllm.model_executor.models.keye.BaseKeyeModule", "vllm.model_executor.models.keye.KeyeBaseDummyInputsBuilder", "vllm.model_executor.models.keye.KeyeDummyInputsBuilder", "vllm.model_executor.models.keye.KeyeForConditionalGeneration", "vllm.model_executor.models.keye.KeyeImageEmbeddingInputs", "vllm.model_executor.models.keye.KeyeImageInputs", "vllm.model_executor.models.keye.KeyeImagePixelInputs", "vllm.model_executor.models.keye.KeyeMultiModalDataParser", "vllm.model_executor.models.keye.KeyeMultiModalProcessor", "vllm.model_executor.models.keye.KeyeProcessingInfo", "vllm.model_executor.models.keye.KeyeSiglipAttention", "vllm.model_executor.models.keye.KeyeSiglipEncoder", "vllm.model_executor.models.keye.KeyeSiglipEncoderLayer", "vllm.model_executor.models.keye.KeyeSiglipVisionModel", "vllm.model_executor.models.keye.KeyeSiglipVisionTransformer", "vllm.model_executor.models.keye.KeyeVideoEmbeddingInputs", "vllm.model_executor.models.keye.KeyeVideoInputs", "vllm.model_executor.models.keye.KeyeVideoPixelInputs", "vllm.model_executor.models.keye.KeyeVisionEmbeddings", "vllm.model_executor.models.keye.Projector", "vllm.model_executor.models.keye.SigLIPRotaryEmbedding", "vllm.model_executor.models.keye.apply_rotary_pos_emb_flashatt", "vllm.model_executor.models.keye.logger", "vllm.model_executor.models.keye.smart_resize" ], "n_typable": 293, "n_typed": 214, "n_any": 1, "n_untyped": 78, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 10, "n_methods": 58, "n_method_overloads": 58, "n_method_params": 151, "n_classes": 19, "n_attrs": 73, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/keye_vl1_5.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.keye_vl1_5.KeyeVL1_5MultiModalProcessor", "methods": [ { "kind": "function", "name": "KeyeVL1_5MultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "KeyeVL1_5MultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.keye_vl1_5.KeyeVL1_5ImageEmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "KeyeVL1_5ImageEmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KeyeVL1_5ImageEmbeddingInputs.image_embeds", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KeyeVL1_5ImageEmbeddingInputs.image_grid_thw", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.keye_vl1_5.KeyeVL1_5VideoPixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "KeyeVL1_5VideoPixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KeyeVL1_5VideoPixelInputs.pixel_values_videos", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KeyeVL1_5VideoPixelInputs.video_grid_thw", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KeyeVL1_5VideoPixelInputs.num_frames", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.keye_vl1_5.KeyeVL1_5ImageInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.keye_vl1_5.KeyeVL1_5ForConditionalGeneration", "methods": [ { "kind": "function", "name": "KeyeVL1_5ForConditionalGeneration._build_projector", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "KeyeVL1_5ForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "KeyeVL1_5ForConditionalGeneration._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KeyeVL1_5ForConditionalGeneration._parse_and_validate_video_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KeyeVL1_5ForConditionalGeneration._process_video_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KeyeVL1_5ForConditionalGeneration.get_mrope_input_positions", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "KeyeVL1_5ForConditionalGeneration.merge_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 16, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 11, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.keye_vl1_5.KeyeVL1_5Projector", "methods": [ { "kind": "function", "name": "KeyeVL1_5Projector.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "KeyeVL1_5Projector.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "KeyeVL1_5Projector.text_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KeyeVL1_5Projector.vision_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KeyeVL1_5Projector.merge_kernel_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KeyeVL1_5Projector.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KeyeVL1_5Projector.pre_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KeyeVL1_5Projector.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KeyeVL1_5Projector.linear_1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KeyeVL1_5Projector.linear_2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 7, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.keye_vl1_5.KeyeVL1_5MultiModalDataParser", "methods": [ { "kind": "function", "name": "KeyeVL1_5MultiModalDataParser._parse_image_data", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KeyeVL1_5MultiModalDataParser._parse_video_data", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.keye_vl1_5.KeyeVL1_5ProcessingInfo", "methods": [ { "kind": "function", "name": "KeyeVL1_5ProcessingInfo.get_data_parser", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KeyeVL1_5ProcessingInfo.get_max_frame_per_video", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KeyeVL1_5ProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.keye_vl1_5.KeyeVL1_5DummyInputsBuilder", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.keye_vl1_5.split_thw", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.model_executor.models.keye_vl1_5.KeyeVL1_5VideoEmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "KeyeVL1_5VideoEmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KeyeVL1_5VideoEmbeddingInputs.video_embeds", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KeyeVL1_5VideoEmbeddingInputs.video_grid_thw", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KeyeVL1_5VideoEmbeddingInputs.num_frames", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.keye_vl1_5.KeyeVL1_5VideoInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.models.keye_vl1_5.get_num_patches", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.models.keye_vl1_5.KeyeVL1_5ImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "KeyeVL1_5ImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KeyeVL1_5ImagePixelInputs.pixel_values", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KeyeVL1_5ImagePixelInputs.image_grid_thw", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.keye_vl1_5.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.models.keye_vl1_5", "names": [ "vllm.model_executor.models.keye_vl1_5.KeyeVL1_5DummyInputsBuilder", "vllm.model_executor.models.keye_vl1_5.KeyeVL1_5ForConditionalGeneration", "vllm.model_executor.models.keye_vl1_5.KeyeVL1_5ImageEmbeddingInputs", "vllm.model_executor.models.keye_vl1_5.KeyeVL1_5ImageInputs", "vllm.model_executor.models.keye_vl1_5.KeyeVL1_5ImagePixelInputs", "vllm.model_executor.models.keye_vl1_5.KeyeVL1_5MultiModalDataParser", "vllm.model_executor.models.keye_vl1_5.KeyeVL1_5MultiModalProcessor", "vllm.model_executor.models.keye_vl1_5.KeyeVL1_5ProcessingInfo", "vllm.model_executor.models.keye_vl1_5.KeyeVL1_5Projector", "vllm.model_executor.models.keye_vl1_5.KeyeVL1_5VideoEmbeddingInputs", "vllm.model_executor.models.keye_vl1_5.KeyeVL1_5VideoInputs", "vllm.model_executor.models.keye_vl1_5.KeyeVL1_5VideoPixelInputs", "vllm.model_executor.models.keye_vl1_5.get_num_patches", "vllm.model_executor.models.keye_vl1_5.logger", "vllm.model_executor.models.keye_vl1_5.split_thw" ], "n_typable": 70, "n_typed": 57, "n_any": 0, "n_untyped": 13, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 3, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 24, "n_classes": 10, "n_attrs": 26, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/kimi_k25.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.kimi_k25.MaxImageTokenMeta", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "MaxImageTokenMeta.width", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MaxImageTokenMeta.height", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.kimi_k25.KimiK25MediaPixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "KimiK25MediaPixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25MediaPixelInputs.pixel_values", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25MediaPixelInputs.grid_thws", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.kimi_k25.KimiK25MultiModalProcessor", "methods": [ { "kind": "function", "name": "KimiK25MultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "KimiK25MultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "KimiK25MultiModalProcessor.split_video_chunks", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 7, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.kimi_k25.KimiK25DummyInputsBuilder", "methods": [ { "kind": "function", "name": "KimiK25DummyInputsBuilder.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KimiK25DummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KimiK25DummyInputsBuilder.get_dummy_mm_items", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KimiK25DummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "KimiK25DummyInputsBuilder.media_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25DummyInputsBuilder.frame_per_chunk", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 8, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 5, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.kimi_k25.KimiK25ForConditionalGeneration", "methods": [ { "kind": "function", "name": "KimiK25ForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "KimiK25ForConditionalGeneration.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "KimiK25ForConditionalGeneration._maybe_ignore_quant_config", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KimiK25ForConditionalGeneration._parse_and_validate_media_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KimiK25ForConditionalGeneration._process_media_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KimiK25ForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KimiK25ForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "KimiK25ForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "KimiK25ForConditionalGeneration.load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "KimiK25ForConditionalGeneration.supports_encoder_tp_data", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "KimiK25ForConditionalGeneration.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25ForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25ForConditionalGeneration.use_data_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25ForConditionalGeneration.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25ForConditionalGeneration.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25ForConditionalGeneration.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25ForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25ForConditionalGeneration.media_placeholder", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25ForConditionalGeneration.vision_tower", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25ForConditionalGeneration.mm_projector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25ForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 36, "n_typed": 23, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 16, "n_attrs": 12, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.kimi_k25.MoonshotKimiVAutoProcessor", "methods": [ { "kind": "function", "name": "MoonshotKimiVAutoProcessor.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MoonshotKimiVAutoProcessor.__call__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MoonshotKimiVAutoProcessor.attributes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MoonshotKimiVAutoProcessor.tokenizer_class", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MoonshotKimiVAutoProcessor.media_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonshotKimiVAutoProcessor.media_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 4, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.kimi_k25.KimiK25ProcessingInfo", "methods": [ { "kind": "function", "name": "KimiK25ProcessingInfo.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KimiK25ProcessingInfo.get_hf_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KimiK25ProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KimiK25ProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "KimiK25ProcessingInfo.hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25ProcessingInfo.media_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25ProcessingInfo.media_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25ProcessingInfo.hf_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25ProcessingInfo.media_tokens_calculator", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 3, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 1, "n_attrs": 5, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.kimi_k25.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.models.kimi_k25", "names": [ "vllm.model_executor.models.kimi_k25.KimiK25DummyInputsBuilder", "vllm.model_executor.models.kimi_k25.KimiK25ForConditionalGeneration", "vllm.model_executor.models.kimi_k25.KimiK25MediaPixelInputs", "vllm.model_executor.models.kimi_k25.KimiK25MultiModalProcessor", "vllm.model_executor.models.kimi_k25.KimiK25ProcessingInfo", "vllm.model_executor.models.kimi_k25.MaxImageTokenMeta", "vllm.model_executor.models.kimi_k25.MoonshotKimiVAutoProcessor", "vllm.model_executor.models.kimi_k25.logger" ], "n_typable": 80, "n_typed": 48, "n_any": 0, "n_untyped": 32, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 22, "n_method_overloads": 22, "n_method_params": 34, "n_classes": 7, "n_attrs": 29, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/kimi_k25_vit.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.models.kimi_k25_vit.get_rope_shape_decorate", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.models.kimi_k25_vit.get_1d_sincos_pos_embed", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.models.kimi_k25_vit.vision_tower_forward", "n_typed": 4, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.model_executor.models.kimi_k25_vit.apply_rope", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.models.kimi_k25_vit.tpool_patch_merger", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.model_executor.models.kimi_k25_vit.KimiK25MultiModalProjector", "methods": [ { "kind": "function", "name": "KimiK25MultiModalProjector.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "KimiK25MultiModalProjector.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "KimiK25MultiModalProjector.use_data_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25MultiModalProjector.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25MultiModalProjector.pre_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25MultiModalProjector.linear_1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25MultiModalProjector.linear_2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25MultiModalProjector.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 6, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 6, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.kimi_k25_vit.mm_projector_forward", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.models.kimi_k25_vit.get_1d_sincos_pos_embed_from_grid", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.models.kimi_k25_vit.MoonVision3dPatchEmbed", "methods": [ { "kind": "function", "name": "MoonVision3dPatchEmbed.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "MoonVision3dPatchEmbed.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MoonVision3dPatchEmbed.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonVision3dPatchEmbed.proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonVision3dPatchEmbed.pos_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 10, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 9, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.kimi_k25_vit.MLP2", "methods": [ { "kind": "function", "name": "MLP2.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "MLP2.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MLP2.use_data_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLP2.fc0", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLP2.fc1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLP2.activation", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 7, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.kimi_k25_vit.MoonViT3dEncoder", "methods": [ { "kind": "function", "name": "MoonViT3dEncoder.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "MoonViT3dEncoder.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MoonViT3dEncoder.video_attn_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonViT3dEncoder.rope_2d", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonViT3dEncoder.blocks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonViT3dEncoder.final_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 10, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.kimi_k25_vit.Rope2DPosEmbRepeated", "methods": [ { "kind": "function", "name": "Rope2DPosEmbRepeated.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Rope2DPosEmbRepeated.extra_repr", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Rope2DPosEmbRepeated._precompute_freqs_cis", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Rope2DPosEmbRepeated.get_freqs_cis", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Rope2DPosEmbRepeated.dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Rope2DPosEmbRepeated.max_height", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Rope2DPosEmbRepeated.max_width", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Rope2DPosEmbRepeated.theta_base", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 8, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 7, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.kimi_k25_vit.MoonViTEncoderLayer", "methods": [ { "kind": "function", "name": "MoonViTEncoderLayer.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "MoonViTEncoderLayer.attention_qkvpacked", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MoonViTEncoderLayer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MoonViTEncoderLayer.use_data_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonViTEncoderLayer.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonViTEncoderLayer.hidden_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonViTEncoderLayer.hidden_size_per_attention_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonViTEncoderLayer.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonViTEncoderLayer.num_attention_heads_per_partition", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonViTEncoderLayer.norm0", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonViTEncoderLayer.norm1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonViTEncoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonViTEncoderLayer.wqkv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonViTEncoderLayer.wo", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonViTEncoderLayer.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 28, "n_typed": 12, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 13, "n_attrs": 12, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.kimi_k25_vit.Learnable2DInterpPosEmbDivided_fixed", "methods": [ { "kind": "function", "name": "Learnable2DInterpPosEmbDivided_fixed.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Learnable2DInterpPosEmbDivided_fixed.reset_parameters", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Learnable2DInterpPosEmbDivided_fixed.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Learnable2DInterpPosEmbDivided_fixed.height", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Learnable2DInterpPosEmbDivided_fixed.width", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Learnable2DInterpPosEmbDivided_fixed.num_frames", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Learnable2DInterpPosEmbDivided_fixed.dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Learnable2DInterpPosEmbDivided_fixed.interpolation_mode", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Learnable2DInterpPosEmbDivided_fixed.weight", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 9, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 6, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.kimi_k25_vit.get_rope_shape", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.model_executor.models.kimi_k25_vit.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.kimi_k25_vit.MoonViT3dPretrainedModel", "methods": [ { "kind": "function", "name": "MoonViT3dPretrainedModel.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MoonViT3dPretrainedModel.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MoonViT3dPretrainedModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonViT3dPretrainedModel.merge_kernel_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonViT3dPretrainedModel.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonViT3dPretrainedModel.merge_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonViT3dPretrainedModel.patch_embed", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonViT3dPretrainedModel.encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 6, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.kimi_k25_vit", "names": [ "vllm.model_executor.models.kimi_k25_vit.KimiK25MultiModalProjector", "vllm.model_executor.models.kimi_k25_vit.Learnable2DInterpPosEmbDivided_fixed", "vllm.model_executor.models.kimi_k25_vit.MLP2", "vllm.model_executor.models.kimi_k25_vit.MoonViT3dEncoder", "vllm.model_executor.models.kimi_k25_vit.MoonViT3dPretrainedModel", "vllm.model_executor.models.kimi_k25_vit.MoonViTEncoderLayer", "vllm.model_executor.models.kimi_k25_vit.MoonVision3dPatchEmbed", "vllm.model_executor.models.kimi_k25_vit.Rope2DPosEmbRepeated", "vllm.model_executor.models.kimi_k25_vit.apply_rope", "vllm.model_executor.models.kimi_k25_vit.get_1d_sincos_pos_embed", "vllm.model_executor.models.kimi_k25_vit.get_1d_sincos_pos_embed_from_grid", "vllm.model_executor.models.kimi_k25_vit.get_rope_shape", "vllm.model_executor.models.kimi_k25_vit.get_rope_shape_decorate", "vllm.model_executor.models.kimi_k25_vit.logger", "vllm.model_executor.models.kimi_k25_vit.mm_projector_forward", "vllm.model_executor.models.kimi_k25_vit.tpool_patch_merger", "vllm.model_executor.models.kimi_k25_vit.vision_tower_forward" ], "n_typable": 157, "n_typed": 82, "n_any": 2, "n_untyped": 73, "n_functions": 8, "n_function_overloads": 8, "n_function_params": 22, "n_methods": 20, "n_method_overloads": 20, "n_method_params": 61, "n_classes": 8, "n_attrs": 46, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/kimi_linear.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.kimi_linear.KimiMLAAttention", "methods": [ { "kind": "function", "name": "KimiMLAAttention.__init__", "n_typed": 13, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 }, { "kind": "function", "name": "KimiMLAAttention.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "KimiMLAAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiMLAAttention.qk_nope_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiMLAAttention.qk_rope_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiMLAAttention.qk_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiMLAAttention.v_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiMLAAttention.q_lora_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiMLAAttention.kv_lora_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiMLAAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiMLAAttention.num_local_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiMLAAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiMLAAttention.use_nope", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiMLAAttention.kv_a_proj_with_mqa", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiMLAAttention.q_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiMLAAttention.kv_a_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiMLAAttention.kv_b_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiMLAAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiMLAAttention.mla_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 35, "n_typed": 17, "n_any": 0, "n_untyped": 18, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 16, "n_attrs": 17, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.kimi_linear.KimiLinearModel", "methods": [ { "kind": "function", "name": "KimiLinearModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "KimiLinearModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KimiLinearModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "KimiLinearModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 9, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 8, "n_attrs": 4, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.kimi_linear.get_spec_layer_idx_from_weight_name", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.models.kimi_linear.KimiLinearForCausalLM", "methods": [ { "kind": "function", "name": "KimiLinearForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "KimiLinearForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KimiLinearForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "KimiLinearForCausalLM.get_mamba_state_dtype_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KimiLinearForCausalLM.get_mamba_state_shape_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KimiLinearForCausalLM.get_mamba_state_copy_func", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KimiLinearForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KimiLinearForCausalLM.load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "KimiLinearForCausalLM.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearForCausalLM.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 27, "n_typed": 17, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 12, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.kimi_linear.KimiDecoderLayer", "methods": [ { "kind": "function", "name": "KimiDecoderLayer.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "KimiDecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "KimiDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiDecoderLayer.is_moe", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiDecoderLayer.block_sparse_moe", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 12, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 12, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.kimi_linear.KimiMLP", "methods": [ { "kind": "function", "name": "KimiMLP.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "KimiMLP.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "KimiMLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.kimi_linear.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.kimi_linear.KimiMoE", "methods": [ { "kind": "function", "name": "KimiMoE.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "KimiMoE.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "KimiMoE.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiMoE.routed_scaling_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiMoE.num_shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiMoE.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiMoE.gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiMoE.experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiMoE.shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 6, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 7, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.kimi_linear", "names": [ "vllm.model_executor.models.kimi_linear.KimiDecoderLayer", "vllm.model_executor.models.kimi_linear.KimiLinearForCausalLM", "vllm.model_executor.models.kimi_linear.KimiLinearModel", "vllm.model_executor.models.kimi_linear.KimiMLAAttention", "vllm.model_executor.models.kimi_linear.KimiMLP", "vllm.model_executor.models.kimi_linear.KimiMoE", "vllm.model_executor.models.kimi_linear.get_spec_layer_idx_from_weight_name", "vllm.model_executor.models.kimi_linear.logger" ], "n_typable": 128, "n_typed": 71, "n_any": 0, "n_untyped": 57, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 19, "n_method_overloads": 19, "n_method_params": 60, "n_classes": 6, "n_attrs": 46, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/kimi_vl.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.kimi_vl.MaxImageTokenMeta", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "MaxImageTokenMeta.width", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MaxImageTokenMeta.height", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.kimi_vl.KimiVLForConditionalGeneration", "methods": [ { "kind": "function", "name": "KimiVLForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "KimiVLForConditionalGeneration.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "KimiVLForConditionalGeneration._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KimiVLForConditionalGeneration._process_image_pixels", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KimiVLForConditionalGeneration._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KimiVLForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KimiVLForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "KimiVLForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "KimiVLForConditionalGeneration.load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "KimiVLForConditionalGeneration.supports_encoder_tp_data", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "KimiVLForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiVLForConditionalGeneration.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiVLForConditionalGeneration.use_data_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiVLForConditionalGeneration.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiVLForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiVLForConditionalGeneration.media_placeholder", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KimiVLForConditionalGeneration.vision_tower", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiVLForConditionalGeneration.multi_modal_projector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiVLForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 34, "n_typed": 24, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 16, "n_attrs": 10, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.kimi_vl.KimiVLImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "KimiVLImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KimiVLImagePixelInputs.pixel_values", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KimiVLImagePixelInputs.image_grid_hws", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.kimi_vl.KimiVLMultiModalProjector", "methods": [ { "kind": "function", "name": "KimiVLMultiModalProjector.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "KimiVLMultiModalProjector.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "KimiVLMultiModalProjector.use_data_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiVLMultiModalProjector.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiVLMultiModalProjector.pre_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiVLMultiModalProjector.linear_1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiVLMultiModalProjector.linear_2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiVLMultiModalProjector.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 4, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.kimi_vl.KimiVLProcessingInfo", "methods": [ { "kind": "function", "name": "KimiVLProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KimiVLProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KimiVLProcessingInfo.get_num_image_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [ { "kind": "property", "name": "KimiVLProcessingInfo.image_token_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [], "n_typable": 6, "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 2, "n_attrs": 0, "n_properties": 1 }, { "kind": "class", "name": "vllm.model_executor.models.kimi_vl.KimiVLDummyInputsBuilder", "methods": [ { "kind": "function", "name": "KimiVLDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KimiVLDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.kimi_vl.KimiVLMultiModalProcessor", "methods": [ { "kind": "function", "name": "KimiVLMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "KimiVLMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.kimi_vl", "names": [ "vllm.model_executor.models.kimi_vl.KimiVLDummyInputsBuilder", "vllm.model_executor.models.kimi_vl.KimiVLForConditionalGeneration", "vllm.model_executor.models.kimi_vl.KimiVLImagePixelInputs", "vllm.model_executor.models.kimi_vl.KimiVLMultiModalProcessor", "vllm.model_executor.models.kimi_vl.KimiVLMultiModalProjector", "vllm.model_executor.models.kimi_vl.KimiVLProcessingInfo", "vllm.model_executor.models.kimi_vl.MaxImageTokenMeta" ], "n_typable": 67, "n_typed": 49, "n_any": 0, "n_untyped": 18, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 18, "n_method_overloads": 18, "n_method_params": 30, "n_classes": 7, "n_attrs": 21, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/lfm2.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.lfm2.Lfm2Model", "methods": [ { "kind": "function", "name": "Lfm2Model.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Lfm2Model.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Lfm2Model.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Lfm2Model.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Lfm2Model.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2Model.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2Model.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2Model.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2Model.embedding_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 11, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.lfm2.Lfm2MLP", "methods": [ { "kind": "function", "name": "Lfm2MLP.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "Lfm2MLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Lfm2MLP.w13", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MLP.w2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 9, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.lfm2.Lfm2AttentionDecoderLayer", "methods": [ { "kind": "function", "name": "Lfm2AttentionDecoderLayer.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Lfm2AttentionDecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Lfm2AttentionDecoderLayer.prefix", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2AttentionDecoderLayer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2AttentionDecoderLayer.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2AttentionDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2AttentionDecoderLayer.feed_forward", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2AttentionDecoderLayer.operator_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2AttentionDecoderLayer.ffn_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 11, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 10, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.lfm2.Lfm2ShortConvDecoderLayer", "methods": [ { "kind": "function", "name": "Lfm2ShortConvDecoderLayer.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Lfm2ShortConvDecoderLayer.forward", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Lfm2ShortConvDecoderLayer.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2ShortConvDecoderLayer.short_conv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2ShortConvDecoderLayer.feed_forward", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2ShortConvDecoderLayer.operator_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2ShortConvDecoderLayer.ffn_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 9, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 9, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.lfm2.Lfm2Attention", "methods": [ { "kind": "function", "name": "Lfm2Attention.__init__", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "Lfm2Attention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Lfm2Attention.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2Attention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2Attention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2Attention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2Attention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2Attention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2Attention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2Attention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2Attention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2Attention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2Attention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2Attention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2Attention.out_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2Attention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2Attention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2Attention.q_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2Attention.k_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 30, "n_typed": 13, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 11, "n_attrs": 17, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.lfm2.Lfm2ForCausalLM", "methods": [ { "kind": "function", "name": "Lfm2ForCausalLM.get_mamba_state_dtype_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Lfm2ForCausalLM.get_mamba_state_shape_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Lfm2ForCausalLM.get_mamba_state_copy_func", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Lfm2ForCausalLM.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Lfm2ForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Lfm2ForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Lfm2ForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Lfm2ForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Lfm2ForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Lfm2ForCausalLM.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2ForCausalLM.embedding_modules", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Lfm2ForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2ForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2ForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2ForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2ForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 26, "n_typed": 19, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 12, "n_attrs": 8, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.lfm2", "names": [ "vllm.model_executor.models.lfm2.Lfm2Attention", "vllm.model_executor.models.lfm2.Lfm2AttentionDecoderLayer", "vllm.model_executor.models.lfm2.Lfm2ForCausalLM", "vllm.model_executor.models.lfm2.Lfm2MLP", "vllm.model_executor.models.lfm2.Lfm2Model", "vllm.model_executor.models.lfm2.Lfm2ShortConvDecoderLayer" ], "n_typable": 121, "n_typed": 72, "n_any": 0, "n_untyped": 49, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 20, "n_method_overloads": 20, "n_method_params": 58, "n_classes": 6, "n_attrs": 45, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/lfm2_moe.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.lfm2_moe.Lfm2MoeForCausalLM", "methods": [ { "kind": "function", "name": "Lfm2MoeForCausalLM.get_mamba_state_dtype_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Lfm2MoeForCausalLM.get_mamba_state_shape_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Lfm2MoeForCausalLM.get_mamba_state_copy_func", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Lfm2MoeForCausalLM.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Lfm2MoeForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Lfm2MoeForCausalLM.update_physical_experts_metadata", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Lfm2MoeForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Lfm2MoeForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Lfm2MoeForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Lfm2MoeForCausalLM.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Lfm2MoeForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Lfm2MoeForCausalLM.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeForCausalLM.embedding_modules", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Lfm2MoeForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeForCausalLM.expert_weights", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeForCausalLM.moe_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeForCausalLM.num_moe_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeForCausalLM.num_expert_groups", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeForCausalLM.num_shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeForCausalLM.num_logical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeForCausalLM.num_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeForCausalLM.num_local_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeForCausalLM.num_routed_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeForCausalLM.num_redundant_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 40, "n_typed": 23, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 14, "n_attrs": 18, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.lfm2_moe.Lfm2MoeSparseMoeBlock", "methods": [ { "kind": "function", "name": "Lfm2MoeSparseMoeBlock.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Lfm2MoeSparseMoeBlock.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Lfm2MoeSparseMoeBlock.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeSparseMoeBlock.routed_scaling_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeSparseMoeBlock.ep_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeSparseMoeBlock.ep_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeSparseMoeBlock.ep_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeSparseMoeBlock.n_routed_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeSparseMoeBlock.enable_eplb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeSparseMoeBlock.n_logical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeSparseMoeBlock.n_redundant_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeSparseMoeBlock.n_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeSparseMoeBlock.n_local_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeSparseMoeBlock.physical_expert_start", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeSparseMoeBlock.physical_expert_end", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeSparseMoeBlock.gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeSparseMoeBlock.experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 6, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 15, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.lfm2_moe.Lfm2MoeModel", "methods": [ { "kind": "function", "name": "Lfm2MoeModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Lfm2MoeModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Lfm2MoeModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Lfm2MoeModel.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Lfm2MoeModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Lfm2MoeModel.num_redundant_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeModel.embedding_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 12, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 8, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.lfm2_moe.Lfm2MoeMlp", "methods": [ { "kind": "function", "name": "Lfm2MoeMlp.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Lfm2MoeMlp.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Lfm2MoeMlp.w13", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeMlp.w2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeMlp.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 6, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.lfm2_moe.Lfm2MoeAttentionDecoderLayer", "methods": [ { "kind": "function", "name": "Lfm2MoeAttentionDecoderLayer.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "Lfm2MoeAttentionDecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Lfm2MoeAttentionDecoderLayer.prefix", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeAttentionDecoderLayer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeAttentionDecoderLayer.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeAttentionDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeAttentionDecoderLayer.operator_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeAttentionDecoderLayer.ffn_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeAttentionDecoderLayer.feed_forward", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 12, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 11, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.lfm2_moe.Lfm2MoeAttention", "methods": [ { "kind": "function", "name": "Lfm2MoeAttention.__init__", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "Lfm2MoeAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Lfm2MoeAttention.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeAttention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeAttention.out_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeAttention.q_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeAttention.k_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 30, "n_typed": 13, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 11, "n_attrs": 17, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.lfm2_moe.Lfm2MoeShortConvDecoderLayer", "methods": [ { "kind": "function", "name": "Lfm2MoeShortConvDecoderLayer.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "Lfm2MoeShortConvDecoderLayer.forward", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Lfm2MoeShortConvDecoderLayer.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeShortConvDecoderLayer.short_conv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeShortConvDecoderLayer.operator_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeShortConvDecoderLayer.ffn_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeShortConvDecoderLayer.feed_forward", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 10, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 10, "n_attrs": 5, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.lfm2_moe", "names": [ "vllm.model_executor.models.lfm2_moe.Lfm2MoeAttention", "vllm.model_executor.models.lfm2_moe.Lfm2MoeAttentionDecoderLayer", "vllm.model_executor.models.lfm2_moe.Lfm2MoeForCausalLM", "vllm.model_executor.models.lfm2_moe.Lfm2MoeMlp", "vllm.model_executor.models.lfm2_moe.Lfm2MoeModel", "vllm.model_executor.models.lfm2_moe.Lfm2MoeShortConvDecoderLayer", "vllm.model_executor.models.lfm2_moe.Lfm2MoeSparseMoeBlock" ], "n_typable": 158, "n_typed": 82, "n_any": 0, "n_untyped": 76, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 25, "n_method_overloads": 25, "n_method_params": 64, "n_classes": 7, "n_attrs": 71, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/lfm2_siglip2.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.lfm2_siglip2.Siglip2Model", "methods": [ { "kind": "function", "name": "Siglip2Model.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Siglip2Model.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Siglip2Model.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Siglip2Model.vision_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 13, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 11, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.lfm2_siglip2.Siglip2EncoderLayer", "methods": [ { "kind": "function", "name": "Siglip2EncoderLayer.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Siglip2EncoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Siglip2EncoderLayer.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2EncoderLayer.layer_norm1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2EncoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2EncoderLayer.layer_norm2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2EncoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 7, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.lfm2_siglip2.Siglip2VisionEmbeddings", "methods": [ { "kind": "function", "name": "Siglip2VisionEmbeddings.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Siglip2VisionEmbeddings.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Siglip2VisionEmbeddings.resize_positional_embeddings_packed", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Siglip2VisionEmbeddings.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2VisionEmbeddings.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2VisionEmbeddings.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2VisionEmbeddings.patch_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2VisionEmbeddings.num_patches", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2VisionEmbeddings.position_embedding_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2VisionEmbeddings.position_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 8, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.lfm2_siglip2.Siglip2Encoder", "methods": [ { "kind": "function", "name": "Siglip2Encoder.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Siglip2Encoder.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Siglip2Encoder.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2Encoder.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 9, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.lfm2_siglip2.Siglip2Attention", "methods": [ { "kind": "function", "name": "Siglip2Attention.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Siglip2Attention.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Siglip2Attention.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2Attention.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2Attention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2Attention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2Attention.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2Attention.dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2Attention.num_heads_per_partition", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2Attention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2Attention.out_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2Attention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 7, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 10, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.lfm2_siglip2.Siglip2MLP", "methods": [ { "kind": "function", "name": "Siglip2MLP.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Siglip2MLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Siglip2MLP.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2MLP.activation_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2MLP.fc1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2MLP.fc2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 5, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.lfm2_siglip2.Siglip2VisionTransformer", "methods": [ { "kind": "function", "name": "Siglip2VisionTransformer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Siglip2VisionTransformer.get_input_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Siglip2VisionTransformer.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Siglip2VisionTransformer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2VisionTransformer.embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2VisionTransformer.encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2VisionTransformer.post_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 11, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 10, "n_attrs": 4, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.lfm2_siglip2", "names": [ "vllm.model_executor.models.lfm2_siglip2.Siglip2Attention", "vllm.model_executor.models.lfm2_siglip2.Siglip2Encoder", "vllm.model_executor.models.lfm2_siglip2.Siglip2EncoderLayer", "vllm.model_executor.models.lfm2_siglip2.Siglip2MLP", "vllm.model_executor.models.lfm2_siglip2.Siglip2Model", "vllm.model_executor.models.lfm2_siglip2.Siglip2VisionEmbeddings", "vllm.model_executor.models.lfm2_siglip2.Siglip2VisionTransformer" ], "n_typable": 101, "n_typed": 60, "n_any": 0, "n_untyped": 41, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 17, "n_method_overloads": 17, "n_method_params": 51, "n_classes": 7, "n_attrs": 33, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/lfm2_vl.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.lfm2_vl.Lfm2VLImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Lfm2VLImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2VLImagePixelInputs.pixel_values", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2VLImagePixelInputs.spatial_shapes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2VLImagePixelInputs.num_patches", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.lfm2_vl.Lfm2VLMultiModalProcessor", "methods": [ { "kind": "function", "name": "Lfm2VLMultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Lfm2VLMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Lfm2VLMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.lfm2_vl.Lfm2VLDummyInputsBuilder", "methods": [ { "kind": "function", "name": "Lfm2VLDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Lfm2VLDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.lfm2_vl.Lfm2VLMultiModalProjector", "methods": [ { "kind": "function", "name": "Lfm2VLMultiModalProjector.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Lfm2VLMultiModalProjector.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Lfm2VLMultiModalProjector.use_data_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2VLMultiModalProjector.factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2VLMultiModalProjector.projector_use_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2VLMultiModalProjector.linear_1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2VLMultiModalProjector.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2VLMultiModalProjector.linear_2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2VLMultiModalProjector.layer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 5, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.lfm2_vl.Lfm2VLProcessingInfo", "methods": [ { "kind": "function", "name": "Lfm2VLProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Lfm2VLProcessingInfo.get_hf_processor", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Lfm2VLProcessingInfo.get_image_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Lfm2VLProcessingInfo.get_default_tok_params", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Lfm2VLProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Lfm2VLProcessingInfo.get_image_size_with_most_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Lfm2VLProcessingInfo._is_image_too_large", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Lfm2VLProcessingInfo.smart_resize", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Lfm2VLProcessingInfo._target_ratios", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Lfm2VLProcessingInfo._get_grid_layout", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Lfm2VLProcessingInfo._get_image_feature_grid_size", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Lfm2VLProcessingInfo.get_num_patches", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Lfm2VLProcessingInfo.get_image_repl", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Lfm2VLProcessingInfo.get_num_image_tokens", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 51, "n_typed": 48, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 37, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.lfm2_vl.Lfm2VLForConditionalGeneration", "methods": [ { "kind": "function", "name": "Lfm2VLForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Lfm2VLForConditionalGeneration.get_mamba_state_dtype_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Lfm2VLForConditionalGeneration.get_mamba_state_shape_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Lfm2VLForConditionalGeneration.get_mamba_state_copy_func", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Lfm2VLForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Lfm2VLForConditionalGeneration._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Lfm2VLForConditionalGeneration.image_pixels_to_features", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Lfm2VLForConditionalGeneration._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Lfm2VLForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Lfm2VLForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Lfm2VLForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Lfm2VLForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Lfm2VLForConditionalGeneration.get_mm_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Lfm2VLForConditionalGeneration.merge_by_field_config", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Lfm2VLForConditionalGeneration.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2VLForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2VLForConditionalGeneration.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2VLForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2VLForConditionalGeneration.use_data_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2VLForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2VLForConditionalGeneration.multi_modal_projector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2VLForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2VLForConditionalGeneration.vision_tower", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 40, "n_typed": 30, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 18, "n_attrs": 10, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.lfm2_vl", "names": [ "vllm.model_executor.models.lfm2_vl.Lfm2VLDummyInputsBuilder", "vllm.model_executor.models.lfm2_vl.Lfm2VLForConditionalGeneration", "vllm.model_executor.models.lfm2_vl.Lfm2VLImagePixelInputs", "vllm.model_executor.models.lfm2_vl.Lfm2VLMultiModalProcessor", "vllm.model_executor.models.lfm2_vl.Lfm2VLMultiModalProjector", "vllm.model_executor.models.lfm2_vl.Lfm2VLProcessingInfo" ], "n_typable": 126, "n_typed": 105, "n_any": 0, "n_untyped": 21, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 34, "n_method_overloads": 34, "n_method_params": 72, "n_classes": 6, "n_attrs": 21, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/lightonocr.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.lightonocr.LightOnOCRForConditionalGeneration", "methods": [ { "kind": "function", "name": "LightOnOCRForConditionalGeneration.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LightOnOCRForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LightOnOCRForConditionalGeneration.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LightOnOCRForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LightOnOCRForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LightOnOCRForConditionalGeneration.vision_tower", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LightOnOCRForConditionalGeneration.multi_modal_projector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LightOnOCRForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LightOnOCRForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 5, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.lightonocr.LightOnOCRMultiModalProcessor", "methods": [ { "kind": "function", "name": "LightOnOCRMultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "LightOnOCRMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LightOnOCRMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.lightonocr", "names": [ "vllm.model_executor.models.lightonocr.LightOnOCRForConditionalGeneration", "vllm.model_executor.models.lightonocr.LightOnOCRMultiModalProcessor" ], "n_typable": 24, "n_typed": 17, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 12, "n_classes": 2, "n_attrs": 7, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/llama.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.llama.LlamaDecoderLayer", "methods": [ { "kind": "function", "name": "LlamaDecoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "LlamaDecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LlamaDecoderLayer.get_quant_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LlamaDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 11, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 8, "n_attrs": 5, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.llama.llama_model_invariants", "n_typed": 0, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.model_executor.models.llama.LlamaAttention", "methods": [ { "kind": "function", "name": "LlamaAttention.__init__", "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "LlamaAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LlamaAttention._init_rotary_emb", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LlamaAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaAttention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 31, "n_typed": 18, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 15, "n_attrs": 13, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llama.LlamaBidirectionalModel", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llama.LlamaBidirectionalForSequenceClassification", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llama.LlamaModel", "methods": [ { "kind": "function", "name": "LlamaModel.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LlamaModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlamaModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "LlamaModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LlamaModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaModel.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaModel.aux_hidden_state_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 12, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 10, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llama.LlamaForCausalLM", "methods": [ { "kind": "function", "name": "LlamaForCausalLM.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LlamaForCausalLM.set_aux_hidden_state_layers", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlamaForCausalLM.get_eagle3_aux_hidden_state_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LlamaForCausalLM._init_model", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LlamaForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlamaForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "LlamaForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlamaForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LlamaForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LlamaForCausalLM.embedding_modules", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LlamaForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 27, "n_typed": 20, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 14, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llama.LlamaMLP", "methods": [ { "kind": "function", "name": "LlamaMLP.__init__", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "LlamaMLP.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LlamaMLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 9, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 9, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.llama", "names": [ "vllm.model_executor.models.llama.LlamaAttention", "vllm.model_executor.models.llama.LlamaBidirectionalForSequenceClassification", "vllm.model_executor.models.llama.LlamaBidirectionalModel", "vllm.model_executor.models.llama.LlamaDecoderLayer", "vllm.model_executor.models.llama.LlamaForCausalLM", "vllm.model_executor.models.llama.LlamaMLP", "vllm.model_executor.models.llama.LlamaModel", "vllm.model_executor.models.llama.llama_model_invariants" ], "n_typable": 114, "n_typed": 70, "n_any": 0, "n_untyped": 44, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 4, "n_methods": 20, "n_method_overloads": 20, "n_method_params": 56, "n_classes": 7, "n_attrs": 35, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/llama4.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.llama4.Llama4MoE", "methods": [ { "kind": "function", "name": "Llama4MoE.custom_routing_function", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Llama4MoE.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Llama4MoE.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Llama4MoE.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4MoE.top_k", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4MoE.is_sequence_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4MoE.ep_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4MoE.ep_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4MoE.ep_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4MoE.router", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4MoE.shared_expert", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4MoE.enable_eplb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4MoE.n_redundant_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4MoE.n_routed_experts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Llama4MoE.n_logical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4MoE.n_shared_experts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Llama4MoE.n_local_experts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Llama4MoE.n_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4MoE.n_local_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4MoE.experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 27, "n_typed": 10, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 17, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llama4.Llama4Attention", "methods": [ { "kind": "function", "name": "Llama4Attention.__init__", "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "Llama4Attention._get_attn_scale", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Llama4Attention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Llama4Attention.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4Attention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4Attention.no_rope_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4Attention.nope", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4Attention.use_qk_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4Attention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4Attention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4Attention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4Attention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4Attention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4Attention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4Attention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4Attention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4Attention.attn_temperature_tuning", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4Attention.floor_scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4Attention.attn_scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4Attention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4Attention.n_rep", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4Attention.qk_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4Attention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4Attention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4Attention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4Attention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 39, "n_typed": 16, "n_any": 0, "n_untyped": 23, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 13, "n_attrs": 23, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llama4.Llama4ForCausalLM", "methods": [ { "kind": "function", "name": "Llama4ForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Llama4ForCausalLM.set_moe_parameters", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Llama4ForCausalLM.update_physical_experts_metadata", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Llama4ForCausalLM._init_model", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Llama4ForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Llama4ForCausalLM.permute_qk_weight_for_rotary", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Llama4ForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 16, "n_typed": 13, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 10, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llama4.Llama4Model", "methods": [ { "kind": "function", "name": "Llama4Model.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Llama4Model.load_moe_expert_weights", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Llama4Model.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Llama4Model.num_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4Model.n_redundant_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 12, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 10, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llama4.Llama4DecoderLayer", "methods": [ { "kind": "function", "name": "Llama4DecoderLayer.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Llama4DecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Llama4DecoderLayer.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4DecoderLayer.global_layer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4DecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4DecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4DecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4DecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4DecoderLayer.feed_forward", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 8, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 7, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.llama4.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.models.llama4", "names": [ "vllm.model_executor.models.llama4.Llama4Attention", "vllm.model_executor.models.llama4.Llama4DecoderLayer", "vllm.model_executor.models.llama4.Llama4ForCausalLM", "vllm.model_executor.models.llama4.Llama4MoE", "vllm.model_executor.models.llama4.Llama4Model", "vllm.model_executor.models.llama4.logger" ], "n_typable": 113, "n_typed": 59, "n_any": 0, "n_untyped": 54, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 17, "n_method_overloads": 17, "n_method_params": 46, "n_classes": 5, "n_attrs": 51, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/llama4_eagle.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.models.llama4_eagle.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.llama4_eagle.EagleLlama4ForCausalLM", "methods": [ { "kind": "function", "name": "EagleLlama4ForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EagleLlama4ForCausalLM.get_language_model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EagleLlama4ForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "EagleLlama4ForCausalLM.get_top_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EagleLlama4ForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EagleLlama4ForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleLlama4ForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleLlama4ForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleLlama4ForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleLlama4ForCausalLM.embed_input_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 17, "n_typed": 12, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 8, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llama4_eagle.LlamaModel", "methods": [ { "kind": "function", "name": "LlamaModel.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "LlamaModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlamaModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "LlamaModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlamaModel.validate_and_update_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LlamaModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaModel.fc", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaModel.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 23, "n_typed": 17, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 12, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [ { "kind": "type", "rules": null } ], "name": "vllm.model_executor.models.llama4_eagle", "names": [ "vllm.model_executor.models.llama4_eagle.EagleLlama4ForCausalLM", "vllm.model_executor.models.llama4_eagle.LlamaModel", "vllm.model_executor.models.llama4_eagle.logger" ], "n_typable": 41, "n_typed": 29, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 20, "n_classes": 2, "n_attrs": 12, "n_properties": 0, "n_type_ignores": 1 }, { "path": "vllm/model_executor/models/llama_eagle.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.llama_eagle.LlamaDecoderLayer", "methods": [ { "kind": "function", "name": "LlamaDecoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "LlamaDecoderLayer.get_quant_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LlamaDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llama_eagle.EagleLlamaForCausalLM", "methods": [ { "kind": "function", "name": "EagleLlamaForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EagleLlamaForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EagleLlamaForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "EagleLlamaForCausalLM.load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EagleLlamaForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleLlamaForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleLlamaForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 10, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llama_eagle.LlamaModel", "methods": [ { "kind": "function", "name": "LlamaModel.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LlamaModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlamaModel.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LlamaModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LlamaModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaModel.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaModel.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaModel.fc", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 12, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 6, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.llama_eagle.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.models.llama_eagle", "names": [ "vllm.model_executor.models.llama_eagle.EagleLlamaForCausalLM", "vllm.model_executor.models.llama_eagle.LlamaDecoderLayer", "vllm.model_executor.models.llama_eagle.LlamaModel", "vllm.model_executor.models.llama_eagle.logger" ], "n_typable": 42, "n_typed": 29, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 21, "n_classes": 3, "n_attrs": 11, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/llama_eagle3.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.llama_eagle3.LlamaDecoderLayer", "methods": [ { "kind": "function", "name": "LlamaDecoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "LlamaDecoderLayer.get_quant_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlamaDecoderLayer._norm_before_residual", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlamaDecoderLayer._norm_after_residual", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlamaDecoderLayer.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LlamaDecoderLayer.hidden_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaDecoderLayer.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 16, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 11, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llama_eagle3.Eagle3LlamaForCausalLM", "methods": [ { "kind": "function", "name": "Eagle3LlamaForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Eagle3LlamaForCausalLM.embed_input_ids", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Eagle3LlamaForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Eagle3LlamaForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Eagle3LlamaForCausalLM.combine_hidden_states", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Eagle3LlamaForCausalLM.load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Eagle3LlamaForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Eagle3LlamaForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Eagle3LlamaForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Eagle3LlamaForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Eagle3LlamaForCausalLM.draft_id_to_target_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Eagle3LlamaForCausalLM.use_parallel_drafting", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 24, "n_typed": 16, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 12, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llama_eagle3.LlamaModel", "methods": [ { "kind": "function", "name": "LlamaModel.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LlamaModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlamaModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "LlamaModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LlamaModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaModel.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaModel.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaModel.use_aux_hidden_state", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaModel.fc", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 13, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 9, "n_attrs": 8, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.llama_eagle3.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.models.llama_eagle3", "names": [ "vllm.model_executor.models.llama_eagle3.Eagle3LlamaForCausalLM", "vllm.model_executor.models.llama_eagle3.LlamaDecoderLayer", "vllm.model_executor.models.llama_eagle3.LlamaModel", "vllm.model_executor.models.llama_eagle3.logger" ], "n_typable": 64, "n_typed": 45, "n_any": 0, "n_untyped": 19, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 32, "n_classes": 3, "n_attrs": 17, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/llava.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.llava.LlavaDummyInputsBuilder", "methods": [ { "kind": "function", "name": "LlavaDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlavaDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llava.PixtralHFProcessingInfo", "methods": [ { "kind": "function", "name": "PixtralHFProcessingInfo.get_hf_processor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llava.BaseLlavaProcessingInfo", "methods": [ { "kind": "function", "name": "BaseLlavaProcessingInfo.get_hf_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BaseLlavaProcessingInfo.get_vision_encoder_info", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BaseLlavaProcessingInfo.get_hf_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseLlavaProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BaseLlavaProcessingInfo.get_num_image_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseLlavaProcessingInfo.get_image_size_with_most_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BaseLlavaProcessingInfo.get_max_image_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 10, "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llava.LlavaMultiModalProcessor", "methods": [ { "kind": "function", "name": "LlavaMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llava.PixtralHFImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "PixtralHFImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PixtralHFImagePixelInputs.pixel_values", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llava.MantisMultiModalProcessor", "methods": [ { "kind": "function", "name": "MantisMultiModalProcessor.apply", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llava.LlavaForConditionalGeneration", "methods": [ { "kind": "function", "name": "LlavaForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LlavaForConditionalGeneration.set_aux_hidden_state_layers", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlavaForConditionalGeneration.get_eagle3_aux_hidden_state_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LlavaForConditionalGeneration.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LlavaForConditionalGeneration._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlavaForConditionalGeneration._image_pixels_to_features", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LlavaForConditionalGeneration._process_image_pixels", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlavaForConditionalGeneration._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlavaForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlavaForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "LlavaForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlavaForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlavaForConditionalGeneration.get_mm_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LlavaForConditionalGeneration.get_num_mm_encoder_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlavaForConditionalGeneration.get_num_mm_connector_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LlavaForConditionalGeneration.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LlavaForConditionalGeneration.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlavaForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlavaForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlavaForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlavaForConditionalGeneration.vision_tower", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlavaForConditionalGeneration.multi_modal_projector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlavaForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 42, "n_typed": 35, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 20, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llava.LlavaImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "LlavaImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LlavaImagePixelInputs.pixel_values", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llava.MantisForConditionalGeneration", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llava.LlavaLikeConfig", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.llava.LlavaImageInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.llava.BaseLlavaMultiModalProcessor", "methods": [ { "kind": "function", "name": "BaseLlavaMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseLlavaMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llava.PixtralHFMultiModalProcessor", "methods": [ { "kind": "function", "name": "PixtralHFMultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "PixtralHFMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PixtralHFMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llava.LlavaLikeProcessor", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.llava.init_vision_tower_for_llava", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.model_executor.models.llava.LlavaImageEmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "LlavaImageEmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LlavaImageEmbeddingInputs.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llava.LlavaMultiModalProjector", "methods": [ { "kind": "function", "name": "LlavaMultiModalProjector.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "LlavaMultiModalProjector.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LlavaMultiModalProjector.linear_1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlavaMultiModalProjector.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlavaMultiModalProjector.linear_2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 8, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llava.MantisProcessingInfo", "methods": [ { "kind": "function", "name": "MantisProcessingInfo.get_hf_processor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llava.LlavaProcessingInfo", "methods": [ { "kind": "function", "name": "LlavaProcessingInfo.get_hf_processor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.llava", "names": [ "vllm.model_executor.models.llava.BaseLlavaMultiModalProcessor", "vllm.model_executor.models.llava.BaseLlavaProcessingInfo", "vllm.model_executor.models.llava.LlavaDummyInputsBuilder", "vllm.model_executor.models.llava.LlavaForConditionalGeneration", "vllm.model_executor.models.llava.LlavaImageEmbeddingInputs", "vllm.model_executor.models.llava.LlavaImageInputs", "vllm.model_executor.models.llava.LlavaImagePixelInputs", "vllm.model_executor.models.llava.LlavaLikeConfig", "vllm.model_executor.models.llava.LlavaLikeProcessor", "vllm.model_executor.models.llava.LlavaMultiModalProcessor", "vllm.model_executor.models.llava.LlavaMultiModalProjector", "vllm.model_executor.models.llava.LlavaProcessingInfo", "vllm.model_executor.models.llava.MantisForConditionalGeneration", "vllm.model_executor.models.llava.MantisMultiModalProcessor", "vllm.model_executor.models.llava.MantisProcessingInfo", "vllm.model_executor.models.llava.PixtralHFImagePixelInputs", "vllm.model_executor.models.llava.PixtralHFMultiModalProcessor", "vllm.model_executor.models.llava.PixtralHFProcessingInfo", "vllm.model_executor.models.llava.init_vision_tower_for_llava" ], "n_typable": 113, "n_typed": 98, "n_any": 0, "n_untyped": 15, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 4, "n_methods": 36, "n_method_overloads": 36, "n_method_params": 55, "n_classes": 17, "n_attrs": 18, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/llava_next.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.llava_next.LlavaNextProcessingInfo", "methods": [ { "kind": "function", "name": "LlavaNextProcessingInfo.get_hf_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LlavaNextProcessingInfo.get_hf_processor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlavaNextProcessingInfo.get_num_image_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LlavaNextProcessingInfo._get_num_unpadded_features", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "LlavaNextProcessingInfo.get_image_size_with_most_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 13, "n_typed": 12, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 8, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llava_next.LlavaNextMultiModalProcessor", "methods": [ { "kind": "function", "name": "LlavaNextMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llava_next.LlavaNextLikeConfig", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.llava_next.LlavaNextImageInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.llava_next.LlavaNextImageEmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "LlavaNextImageEmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LlavaNextImageEmbeddingInputs.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llava_next.BaseLlavaNextMultiModalProcessor", "methods": [ { "kind": "function", "name": "BaseLlavaNextMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llava_next.LlavaNextForConditionalGeneration", "methods": [ { "kind": "function", "name": "LlavaNextForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LlavaNextForConditionalGeneration.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LlavaNextForConditionalGeneration._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlavaNextForConditionalGeneration._image_pixels_to_features", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LlavaNextForConditionalGeneration._merge_image_patch_embeddings", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LlavaNextForConditionalGeneration._process_image_pixels", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlavaNextForConditionalGeneration._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlavaNextForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlavaNextForConditionalGeneration.embed_input_ids", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "LlavaNextForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "LlavaNextForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlavaNextForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LlavaNextForConditionalGeneration.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlavaNextForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlavaNextForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlavaNextForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlavaNextForConditionalGeneration.select_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlavaNextForConditionalGeneration.vision_tower", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlavaNextForConditionalGeneration.image_newline", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlavaNextForConditionalGeneration.multi_modal_projector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlavaNextForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 45, "n_typed": 36, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 24, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llava_next.LlavaNextImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "LlavaNextImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LlavaNextImagePixelInputs.pixel_values", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LlavaNextImagePixelInputs.image_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.llava_next", "names": [ "vllm.model_executor.models.llava_next.BaseLlavaNextMultiModalProcessor", "vllm.model_executor.models.llava_next.LlavaNextForConditionalGeneration", "vllm.model_executor.models.llava_next.LlavaNextImageEmbeddingInputs", "vllm.model_executor.models.llava_next.LlavaNextImageInputs", "vllm.model_executor.models.llava_next.LlavaNextImagePixelInputs", "vllm.model_executor.models.llava_next.LlavaNextLikeConfig", "vllm.model_executor.models.llava_next.LlavaNextMultiModalProcessor", "vllm.model_executor.models.llava_next.LlavaNextProcessingInfo" ], "n_typable": 70, "n_typed": 60, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 19, "n_method_overloads": 19, "n_method_params": 36, "n_classes": 7, "n_attrs": 15, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/llava_next_video.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.llava_next_video.LlavaNextVideoMultiModalProcessor", "methods": [ { "kind": "function", "name": "LlavaNextVideoMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LlavaNextVideoMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llava_next_video.LlavaNextVideoPixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "LlavaNextVideoPixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LlavaNextVideoPixelInputs.pixel_values_videos", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llava_next_video.LlavaNextVideoForConditionalGeneration", "methods": [ { "kind": "function", "name": "LlavaNextVideoForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LlavaNextVideoForConditionalGeneration.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LlavaNextVideoForConditionalGeneration._parse_and_validate_video_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlavaNextVideoForConditionalGeneration._video_pixels_to_features", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LlavaNextVideoForConditionalGeneration._process_video_pixels", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlavaNextVideoForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlavaNextVideoForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "LlavaNextVideoForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlavaNextVideoForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LlavaNextVideoForConditionalGeneration.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlavaNextVideoForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlavaNextVideoForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlavaNextVideoForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlavaNextVideoForConditionalGeneration.vision_tower", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlavaNextVideoForConditionalGeneration.vision_resampler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlavaNextVideoForConditionalGeneration.multi_modal_projector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlavaNextVideoForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 33, "n_typed": 24, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 16, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llava_next_video.LlavaNextVideoProcessingInfo", "methods": [ { "kind": "function", "name": "LlavaNextVideoProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LlavaNextVideoProcessingInfo.get_vision_encoder_info", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LlavaNextVideoProcessingInfo.get_hf_processor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlavaNextVideoProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LlavaNextVideoProcessingInfo.get_image_size_with_most_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LlavaNextVideoProcessingInfo._get_num_frame_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LlavaNextVideoProcessingInfo.get_num_video_tokens", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LlavaNextVideoProcessingInfo._get_max_video_frames", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlavaNextVideoProcessingInfo.get_num_frames_with_most_features", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 18, "n_typed": 15, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 9, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llava_next_video.LlavaNextVideoDummyInputsBuilder", "methods": [ { "kind": "function", "name": "LlavaNextVideoDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlavaNextVideoDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llava_next_video.LlavaNextVideoPooler", "methods": [ { "kind": "function", "name": "LlavaNextVideoPooler.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlavaNextVideoPooler.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LlavaNextVideoPooler.image_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlavaNextVideoPooler.pool", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 6, "n_typed": 2, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llava_next_video.LlavaNextMultiModalProjector", "methods": [ { "kind": "function", "name": "LlavaNextMultiModalProjector.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "LlavaNextMultiModalProjector.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LlavaNextMultiModalProjector.linear_1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlavaNextMultiModalProjector.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlavaNextMultiModalProjector.linear_2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 6, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.llava_next_video", "names": [ "vllm.model_executor.models.llava_next_video.LlavaNextMultiModalProjector", "vllm.model_executor.models.llava_next_video.LlavaNextVideoDummyInputsBuilder", "vllm.model_executor.models.llava_next_video.LlavaNextVideoForConditionalGeneration", "vllm.model_executor.models.llava_next_video.LlavaNextVideoMultiModalProcessor", "vllm.model_executor.models.llava_next_video.LlavaNextVideoPixelInputs", "vllm.model_executor.models.llava_next_video.LlavaNextVideoPooler", "vllm.model_executor.models.llava_next_video.LlavaNextVideoProcessingInfo" ], "n_typable": 82, "n_typed": 62, "n_any": 0, "n_untyped": 20, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 26, "n_method_overloads": 26, "n_method_params": 41, "n_classes": 7, "n_attrs": 15, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/llava_onevision.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.llava_onevision.LlavaOnevisionLikeConfig", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llava_onevision.LlavaOnevisionMultiModalProcessor", "methods": [ { "kind": "function", "name": "LlavaOnevisionMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LlavaOnevisionMultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "LlavaOnevisionMultiModalProcessor._hf_processor_applies_updates", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "LlavaOnevisionMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 17, "n_typed": 17, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 13, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.llava_onevision.LlavaOnevisionImageInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.llava_onevision.LlavaOnevisionMultiModalProjector", "methods": [ { "kind": "function", "name": "LlavaOnevisionMultiModalProjector.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlavaOnevisionMultiModalProjector.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LlavaOnevisionMultiModalProjector.linear_1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlavaOnevisionMultiModalProjector.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlavaOnevisionMultiModalProjector.linear_2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 3, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llava_onevision.LlavaOnevisionDummyInputsBuilder", "methods": [ { "kind": "function", "name": "LlavaOnevisionDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlavaOnevisionDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.llava_onevision.LlavaOnevisionMultiInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.llava_onevision.LlavaOnevisionProcessingInfo", "methods": [ { "kind": "function", "name": "LlavaOnevisionProcessingInfo.get_hf_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LlavaOnevisionProcessingInfo.get_hf_processor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlavaOnevisionProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LlavaOnevisionProcessingInfo._get_num_unpadded_features", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "LlavaOnevisionProcessingInfo.get_image_size_with_most_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LlavaOnevisionProcessingInfo._get_num_frame_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LlavaOnevisionProcessingInfo.get_num_video_tokens", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LlavaOnevisionProcessingInfo._get_max_video_frames", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlavaOnevisionProcessingInfo.get_num_frames_with_most_features", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LlavaOnevisionProcessingInfo.get_max_video_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 26, "n_typed": 25, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 16, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llava_onevision.LlavaOnevisionForConditionalGeneration", "methods": [ { "kind": "function", "name": "LlavaOnevisionForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LlavaOnevisionForConditionalGeneration.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LlavaOnevisionForConditionalGeneration._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlavaOnevisionForConditionalGeneration._parse_and_validate_video_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlavaOnevisionForConditionalGeneration._parse_and_validate_multimodal_inputs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlavaOnevisionForConditionalGeneration._image_pixels_to_features", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LlavaOnevisionForConditionalGeneration._merge_image_patch_embeddings", "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "LlavaOnevisionForConditionalGeneration._process_image_pixels", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlavaOnevisionForConditionalGeneration._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlavaOnevisionForConditionalGeneration._video_pixels_to_features", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LlavaOnevisionForConditionalGeneration._process_video_pixels", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlavaOnevisionForConditionalGeneration.apply_pooling", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LlavaOnevisionForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlavaOnevisionForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "LlavaOnevisionForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlavaOnevisionForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LlavaOnevisionForConditionalGeneration.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlavaOnevisionForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlavaOnevisionForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlavaOnevisionForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlavaOnevisionForConditionalGeneration.vision_tower", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlavaOnevisionForConditionalGeneration.image_newline", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlavaOnevisionForConditionalGeneration.multi_modal_projector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlavaOnevisionForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 53, "n_typed": 41, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 16, "n_method_overloads": 16, "n_method_params": 29, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llava_onevision.LlavaOnevisionImageEmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "LlavaOnevisionImageEmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LlavaOnevisionImageEmbeddingInputs.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llava_onevision.LlavaOnevisionImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "LlavaOnevisionImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LlavaOnevisionImagePixelInputs.pixel_values", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LlavaOnevisionImagePixelInputs.image_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.llava_onevision.LlavaOnevisionVideoPixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "LlavaOnevisionVideoPixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LlavaOnevisionVideoPixelInputs.pixel_values_videos", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.llava_onevision", "names": [ "vllm.model_executor.models.llava_onevision.LlavaOnevisionDummyInputsBuilder", "vllm.model_executor.models.llava_onevision.LlavaOnevisionForConditionalGeneration", "vllm.model_executor.models.llava_onevision.LlavaOnevisionImageEmbeddingInputs", "vllm.model_executor.models.llava_onevision.LlavaOnevisionImageInputs", "vllm.model_executor.models.llava_onevision.LlavaOnevisionImagePixelInputs", "vllm.model_executor.models.llava_onevision.LlavaOnevisionLikeConfig", "vllm.model_executor.models.llava_onevision.LlavaOnevisionMultiInputs", "vllm.model_executor.models.llava_onevision.LlavaOnevisionMultiModalProcessor", "vllm.model_executor.models.llava_onevision.LlavaOnevisionMultiModalProjector", "vllm.model_executor.models.llava_onevision.LlavaOnevisionProcessingInfo", "vllm.model_executor.models.llava_onevision.LlavaOnevisionVideoPixelInputs" ], "n_typable": 118, "n_typed": 101, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 34, "n_method_overloads": 34, "n_method_params": 64, "n_classes": 9, "n_attrs": 20, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/longcat_flash.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.models.longcat_flash.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.longcat_flash.FlashMLP", "methods": [ { "kind": "function", "name": "FlashMLP.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "FlashMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashMLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 9, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.longcat_flash.FlashDecoderLayer", "methods": [ { "kind": "function", "name": "FlashDecoderLayer.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "FlashDecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashDecoderLayer.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashDecoderLayer.mlps", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 11, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 9, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.longcat_flash.LongcatMoe", "methods": [ { "kind": "function", "name": "LongcatMoe.__init__", "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "LongcatMoe.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LongcatMoe.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LongcatMoe.rounter_params_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LongcatMoe.router", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LongcatMoe.experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 11, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 10, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.longcat_flash.LongcatFlashForCausalLM", "methods": [ { "kind": "function", "name": "LongcatFlashForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LongcatFlashForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LongcatFlashForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "LongcatFlashForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LongcatFlashForCausalLM.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LongcatFlashForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LongcatFlashForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LongcatFlashForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LongcatFlashForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LongcatFlashForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LongcatFlashForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LongcatFlashForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LongcatFlashForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 14, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 9, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.longcat_flash.FlashModel", "methods": [ { "kind": "function", "name": "FlashModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FlashModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlashModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 9, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.longcat_flash.FlashConfig", "methods": [ { "kind": "function", "name": "FlashConfig.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 40, "n_overloads": 1, "n_typable": 40, "n_params": 39, "n_function_overloads": 1, "n_function_params": 39 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashConfig.keys_to_ignore_at_inference", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashConfig.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashConfig.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashConfig.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashConfig.num_hidden_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashConfig.num_attention_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashConfig.ep_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashConfig.kv_lora_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashConfig.q_lora_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashConfig.qk_rope_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashConfig.v_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashConfig.qk_nope_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashConfig.num_experts_per_tok", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashConfig.norm_topk_prob", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashConfig.num_key_value_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashConfig.initializer_range", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashConfig.rms_norm_eps", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashConfig.pretraining_tp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashConfig.use_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashConfig.rope_parameters", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashConfig.attention_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashConfig.attention_dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashConfig.mla_scale_q_lora", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashConfig.mla_scale_kv_lora", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashConfig.zero_expert_num", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashConfig.zero_expert_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashConfig.routed_scaling_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashConfig.hidden_act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashConfig.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashConfig.moe_intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 69, "n_typed": 0, "n_any": 0, "n_untyped": 69, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 39, "n_attrs": 31, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.longcat_flash.LongcatRouter", "methods": [ { "kind": "function", "name": "LongcatRouter.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "LongcatRouter.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LongcatRouter.n_routed_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LongcatRouter.classifier", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LongcatRouter.e_score_correction_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 4, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.longcat_flash", "names": [ "vllm.model_executor.models.longcat_flash.FlashConfig", "vllm.model_executor.models.longcat_flash.FlashDecoderLayer", "vllm.model_executor.models.longcat_flash.FlashMLP", "vllm.model_executor.models.longcat_flash.FlashModel", "vllm.model_executor.models.longcat_flash.LongcatFlashForCausalLM", "vllm.model_executor.models.longcat_flash.LongcatMoe", "vllm.model_executor.models.longcat_flash.LongcatRouter", "vllm.model_executor.models.longcat_flash.logger" ], "n_typable": 162, "n_typed": 58, "n_any": 0, "n_untyped": 104, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 18, "n_method_overloads": 18, "n_method_params": 86, "n_classes": 7, "n_attrs": 61, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/longcat_flash_mtp.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.longcat_flash_mtp.LongCatFlashMTP", "methods": [ { "kind": "function", "name": "LongCatFlashMTP.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LongCatFlashMTP.forward", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "LongCatFlashMTP.compute_logits", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LongCatFlashMTP.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LongCatFlashMTP._rewrite_spec_layer_name", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LongCatFlashMTP.get_spec_layer_idx_from_weight_name", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LongCatFlashMTP.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LongCatFlashMTP.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LongCatFlashMTP.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LongCatFlashMTP.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LongCatFlashMTP.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 27, "n_typed": 21, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 16, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.longcat_flash_mtp.LongCatMultiTokenPredictorLayer", "methods": [ { "kind": "function", "name": "LongCatMultiTokenPredictorLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "LongCatMultiTokenPredictorLayer.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LongCatMultiTokenPredictorLayer.enorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LongCatMultiTokenPredictorLayer.hnorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LongCatMultiTokenPredictorLayer.eh_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LongCatMultiTokenPredictorLayer.mtp_block", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LongCatMultiTokenPredictorLayer.final_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 11, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 9, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.longcat_flash_mtp.LongCatMultiTokenPredictor", "methods": [ { "kind": "function", "name": "LongCatMultiTokenPredictor.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LongCatMultiTokenPredictor.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LongCatMultiTokenPredictor.mtp_start_layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LongCatMultiTokenPredictor.num_mtp_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LongCatMultiTokenPredictor.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LongCatMultiTokenPredictor.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 9, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 4, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.longcat_flash_mtp", "names": [ "vllm.model_executor.models.longcat_flash_mtp.LongCatFlashMTP", "vllm.model_executor.models.longcat_flash_mtp.LongCatMultiTokenPredictor", "vllm.model_executor.models.longcat_flash_mtp.LongCatMultiTokenPredictorLayer" ], "n_typable": 57, "n_typed": 41, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 33, "n_classes": 3, "n_attrs": 14, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/mamba.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.mamba.MambaForCausalLM", "methods": [ { "kind": "function", "name": "MambaForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MambaForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MambaForCausalLM.forward", "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MambaForCausalLM.get_mamba_state_dtype_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MambaForCausalLM.get_mamba_state_shape_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MambaForCausalLM.get_mamba_state_copy_func", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MambaForCausalLM.copy_inputs_before_cuda_graphs", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MambaForCausalLM.get_seqlen_agnostic_capture_inputs", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MambaForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MambaForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MambaForCausalLM.scheduler_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaForCausalLM.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaForCausalLM.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaForCausalLM.backbone", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 33, "n_typed": 18, "n_any": 0, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 15, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mamba.MambaModel", "methods": [ { "kind": "function", "name": "MambaModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MambaModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MambaModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MambaModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MambaModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaModel.embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaModel.norm_f", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 11, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mamba.MambaDecoderLayer", "methods": [ { "kind": "function", "name": "MambaDecoderLayer.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "MambaDecoderLayer.forward", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MambaDecoderLayer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaDecoderLayer.is_falcon_mamba", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaDecoderLayer.is_lora_enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaDecoderLayer.mixer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaDecoderLayer.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 9, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 9, "n_attrs": 5, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.mamba.KVCache", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.mamba", "names": [ "vllm.model_executor.models.mamba.KVCache", "vllm.model_executor.models.mamba.MambaDecoderLayer", "vllm.model_executor.models.mamba.MambaForCausalLM", "vllm.model_executor.models.mamba.MambaModel" ], "n_typable": 66, "n_typed": 38, "n_any": 0, "n_untyped": 28, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 16, "n_method_overloads": 16, "n_method_params": 32, "n_classes": 3, "n_attrs": 19, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/mamba2.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.mamba2.Mamba2DecoderLayer", "methods": [ { "kind": "function", "name": "Mamba2DecoderLayer.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Mamba2DecoderLayer.forward", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Mamba2DecoderLayer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Mamba2DecoderLayer.mixer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Mamba2DecoderLayer.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 8, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mamba2.Mamba2Model", "methods": [ { "kind": "function", "name": "Mamba2Model.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Mamba2Model.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Mamba2Model.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Mamba2Model.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Mamba2Model.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Mamba2Model.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Mamba2Model.embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Mamba2Model.norm_f", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Mamba2Model.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 11, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mamba2.Mamba2ForCausalLM", "methods": [ { "kind": "function", "name": "Mamba2ForCausalLM.get_mamba_state_dtype_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Mamba2ForCausalLM.get_mamba_state_shape_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Mamba2ForCausalLM.get_mamba_state_copy_func", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Mamba2ForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Mamba2ForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Mamba2ForCausalLM.forward", "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Mamba2ForCausalLM.copy_inputs_before_cuda_graphs", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Mamba2ForCausalLM.get_seqlen_agnostic_capture_inputs", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Mamba2ForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Mamba2ForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Mamba2ForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Mamba2ForCausalLM.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Mamba2ForCausalLM.scheduler_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Mamba2ForCausalLM.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Mamba2ForCausalLM.backbone", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Mamba2ForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Mamba2ForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Mamba2ForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 33, "n_typed": 18, "n_any": 0, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 15, "n_attrs": 8, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.mamba2.KVCache", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.mamba2", "names": [ "vllm.model_executor.models.mamba2.KVCache", "vllm.model_executor.models.mamba2.Mamba2DecoderLayer", "vllm.model_executor.models.mamba2.Mamba2ForCausalLM", "vllm.model_executor.models.mamba2.Mamba2Model" ], "n_typable": 63, "n_typed": 37, "n_any": 0, "n_untyped": 26, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 16, "n_method_overloads": 16, "n_method_params": 31, "n_classes": 3, "n_attrs": 17, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/medusa.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.medusa.Medusa", "methods": [ { "kind": "function", "name": "Medusa.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Medusa.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Medusa.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Medusa.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Medusa.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Medusa.blocks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Medusa.orig_vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Medusa.truncated_vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Medusa.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Medusa.token_map", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Medusa.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Medusa.lm_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 9, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 5, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.medusa.ResidualBlock", "methods": [ { "kind": "function", "name": "ResidualBlock.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ResidualBlock.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ResidualBlock.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ResidualBlock.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.medusa", "names": [ "vllm.model_executor.models.medusa.Medusa", "vllm.model_executor.models.medusa.ResidualBlock" ], "n_typable": 25, "n_typed": 15, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 9, "n_classes": 2, "n_attrs": 10, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/midashenglm.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.midashenglm.MiDashengLMModel", "methods": [ { "kind": "function", "name": "MiDashengLMModel.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiDashengLMModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiDashengLMModel._parse_and_validate_audio_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiDashengLMModel._process_audio_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiDashengLMModel.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiDashengLMModel.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MiDashengLMModel.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiDashengLMModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiDashengLMModel.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MiDashengLMModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiDashengLMModel.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiDashengLMModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiDashengLMModel.audio_encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiDashengLMModel.audio_projector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiDashengLMModel.decoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 28, "n_typed": 21, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 14, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.midashenglm.MiDashengLMDummyInputsBuilder", "methods": [ { "kind": "function", "name": "MiDashengLMDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiDashengLMDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.midashenglm.MiDashengLMProcessingInfo", "methods": [ { "kind": "function", "name": "MiDashengLMProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MiDashengLMProcessingInfo.get_feature_extractor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MiDashengLMProcessingInfo.get_data_parser", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MiDashengLMProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MiDashengLMProcessingInfo.get_min_audio_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MiDashengLMProcessingInfo.get_max_audio_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 1, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.midashenglm.MiDashengLMMultiModalProcessor", "methods": [ { "kind": "function", "name": "MiDashengLMMultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MiDashengLMMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiDashengLMMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.midashenglm.DashengAttention", "methods": [ { "kind": "function", "name": "DashengAttention.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "DashengAttention.forward", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DashengAttention.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengAttention.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengAttention.qkv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengAttention.proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 7, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 10, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.midashenglm.MiDashengLMAudioInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "MiDashengLMAudioInputs.input_values", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MiDashengLMAudioInputs.audio_length", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.midashenglm.AudioProjectorSubsample", "methods": [ { "kind": "function", "name": "AudioProjectorSubsample.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "AudioProjectorSubsample.forward", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AudioProjectorSubsample.k", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AudioProjectorSubsample.net", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 5, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.midashenglm.DashengBlock", "methods": [ { "kind": "function", "name": "DashengBlock.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "DashengBlock.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DashengBlock.norm1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengBlock.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengBlock.ls1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengBlock.norm2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengBlock.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengBlock.ls2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 10, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 9, "n_attrs": 6, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.midashenglm.calculate_mel_frames_dasheng", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "class", "name": "vllm.model_executor.models.midashenglm.DashengMlp", "methods": [ { "kind": "function", "name": "DashengMlp.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "DashengMlp.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DashengMlp.fc1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengMlp.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengMlp.fc2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 7, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.midashenglm.AudioPatchEmbed", "methods": [ { "kind": "function", "name": "AudioPatchEmbed.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "AudioPatchEmbed.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AudioPatchEmbed.input_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AudioPatchEmbed.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AudioPatchEmbed.patch_stride", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AudioPatchEmbed.grid_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AudioPatchEmbed.num_patches", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AudioPatchEmbed.flatten", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AudioPatchEmbed.proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AudioPatchEmbed.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 9, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.midashenglm.LayerScale", "methods": [ { "kind": "function", "name": "LayerScale.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LayerScale.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LayerScale.inplace", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LayerScale.gamma", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 2, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.midashenglm.DashengFrontend", "methods": [ { "kind": "function", "name": "DashengFrontend.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DashengFrontend.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DashengFrontend.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengFrontend.spectrogram_window", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DashengFrontend.melscale_fbanks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 7, "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.midashenglm.DashengAudioTransformer", "methods": [ { "kind": "function", "name": "DashengAudioTransformer.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DashengAudioTransformer.forward_features", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DashengAudioTransformer._to_mask", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DashengAudioTransformer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DashengAudioTransformer.target_length", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengAudioTransformer.hop_length", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengAudioTransformer.front_end", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengAudioTransformer.init_bn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengAudioTransformer.patch_embed", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengAudioTransformer.time_pos_embed", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengAudioTransformer.freq_pos_embed", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengAudioTransformer.blocks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengAudioTransformer.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 12, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 9, "n_attrs": 9, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.midashenglm", "names": [ "vllm.model_executor.models.midashenglm.AudioPatchEmbed", "vllm.model_executor.models.midashenglm.AudioProjectorSubsample", "vllm.model_executor.models.midashenglm.DashengAttention", "vllm.model_executor.models.midashenglm.DashengAudioTransformer", "vllm.model_executor.models.midashenglm.DashengBlock", "vllm.model_executor.models.midashenglm.DashengFrontend", "vllm.model_executor.models.midashenglm.DashengMlp", "vllm.model_executor.models.midashenglm.LayerScale", "vllm.model_executor.models.midashenglm.MiDashengLMAudioInputs", "vllm.model_executor.models.midashenglm.MiDashengLMDummyInputsBuilder", "vllm.model_executor.models.midashenglm.MiDashengLMModel", "vllm.model_executor.models.midashenglm.MiDashengLMMultiModalProcessor", "vllm.model_executor.models.midashenglm.MiDashengLMProcessingInfo", "vllm.model_executor.models.midashenglm.calculate_mel_frames_dasheng" ], "n_typable": 175, "n_typed": 105, "n_any": 0, "n_untyped": 70, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 6, "n_methods": 37, "n_method_overloads": 37, "n_method_params": 80, "n_classes": 13, "n_attrs": 52, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/mimo.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.mimo.MiMoModel", "methods": [ { "kind": "function", "name": "MiMoModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MiMoModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.mimo.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.mimo.MiMoForCausalLM", "methods": [ { "kind": "function", "name": "MiMoForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiMoForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiMoForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 4, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.mimo", "names": [ "vllm.model_executor.models.mimo.MiMoForCausalLM", "vllm.model_executor.models.mimo.MiMoModel", "vllm.model_executor.models.mimo.logger" ], "n_typable": 19, "n_typed": 11, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_classes": 2, "n_attrs": 7, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/mimo_mtp.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.mimo_mtp.MiMoMultiTokenPredictor", "methods": [ { "kind": "function", "name": "MiMoMultiTokenPredictor.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiMoMultiTokenPredictor.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiMoMultiTokenPredictor.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MiMoMultiTokenPredictor.compute_logits", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiMoMultiTokenPredictor.mtp_start_layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoMultiTokenPredictor.num_mtp_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoMultiTokenPredictor.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoMultiTokenPredictor.mtp_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoMultiTokenPredictor.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 14, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 11, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mimo_mtp.MiMoMTP", "methods": [ { "kind": "function", "name": "MiMoMTP.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiMoMTP.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiMoMTP.forward", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "MiMoMTP.compute_logits", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiMoMTP.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiMoMTP.map_model_name_to_mtp_param_name", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiMoMTP._rewrite_spec_layer_name", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiMoMTP.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoMTP.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoMTP.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 25, "n_typed": 21, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 15, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mimo_mtp.MiMoMultiTokenPredictorLayer", "methods": [ { "kind": "function", "name": "MiMoMultiTokenPredictorLayer.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MiMoMultiTokenPredictorLayer.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiMoMultiTokenPredictorLayer.token_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoMultiTokenPredictorLayer.hidden_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoMultiTokenPredictorLayer.input_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoMultiTokenPredictorLayer.mtp_block", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoMultiTokenPredictorLayer.final_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 11, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 9, "n_attrs": 5, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.mimo_mtp", "names": [ "vllm.model_executor.models.mimo_mtp.MiMoMTP", "vllm.model_executor.models.mimo_mtp.MiMoMultiTokenPredictor", "vllm.model_executor.models.mimo_mtp.MiMoMultiTokenPredictorLayer" ], "n_typable": 61, "n_typed": 46, "n_any": 0, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 35, "n_classes": 3, "n_attrs": 13, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/mimo_v2_flash.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.models.mimo_v2_flash.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.mimo_v2_flash.MiMoV2FlashForCausalLM", "methods": [ { "kind": "function", "name": "MiMoV2FlashForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiMoV2FlashForCausalLM.set_aux_hidden_state_layers", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiMoV2FlashForCausalLM.get_eagle3_aux_hidden_state_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MiMoV2FlashForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiMoV2FlashForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MiMoV2FlashForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiMoV2FlashForCausalLM.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MiMoV2FlashForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiMoV2FlashForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2FlashForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2FlashForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2FlashForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2FlashForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2FlashForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 24, "n_typed": 17, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 10, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mimo_v2_flash.MiMoV2Model", "methods": [ { "kind": "function", "name": "MiMoV2Model.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiMoV2Model.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiMoV2Model.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MiMoV2Model.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MiMoV2Model.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiMoV2Model.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2Model.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2Model.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2Model.num_redundant_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2Model.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2Model.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2Model.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 12, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 8, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mimo_v2_flash.MiMoV2FlashDecoderLayer", "methods": [ { "kind": "function", "name": "MiMoV2FlashDecoderLayer.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiMoV2FlashDecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MiMoV2FlashDecoderLayer.is_moe_layer", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiMoV2FlashDecoderLayer.is_compressed_softmax_layer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiMoV2FlashDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2FlashDecoderLayer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2FlashDecoderLayer.layer_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2FlashDecoderLayer.is_layer_sparse", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2FlashDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2FlashDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2FlashDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2FlashDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 10, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 6, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mimo_v2_flash.MiMoV2Attention", "methods": [ { "kind": "function", "name": "MiMoV2Attention.__init__", "n_typed": 17, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 17, "n_params": 16, "n_function_overloads": 1, "n_function_params": 16 }, { "kind": "function", "name": "MiMoV2Attention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiMoV2Attention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2Attention.layer_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2Attention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2Attention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2Attention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2Attention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2Attention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2Attention.v_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2Attention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2Attention.k_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2Attention.v_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2Attention.v_scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2Attention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2Attention.rope_theta", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2Attention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2Attention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2Attention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2Attention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2Attention.attention_sink_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2Attention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 40, "n_typed": 20, "n_any": 0, "n_untyped": 20, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 18, "n_attrs": 20, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mimo_v2_flash.MiMoV2MLP", "methods": [ { "kind": "function", "name": "MiMoV2MLP.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "MiMoV2MLP.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiMoV2MLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2MLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2MLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mimo_v2_flash.MiMoV2MoE", "methods": [ { "kind": "function", "name": "MiMoV2MoE.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MiMoV2MoE.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiMoV2MoE.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2MoE.ep_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2MoE.ep_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2MoE.ep_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2MoE.n_routed_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2MoE.is_sequence_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2MoE.enable_eplb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2MoE.n_logical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2MoE.n_redundant_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2MoE.n_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2MoE.n_local_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2MoE.physical_expert_start", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2MoE.physical_expert_end", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2MoE.gate_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2MoE.gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiMoV2MoE.experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 5, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 16, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.mimo_v2_flash", "names": [ "vllm.model_executor.models.mimo_v2_flash.MiMoV2Attention", "vllm.model_executor.models.mimo_v2_flash.MiMoV2FlashDecoderLayer", "vllm.model_executor.models.mimo_v2_flash.MiMoV2FlashForCausalLM", "vllm.model_executor.models.mimo_v2_flash.MiMoV2MLP", "vllm.model_executor.models.mimo_v2_flash.MiMoV2MoE", "vllm.model_executor.models.mimo_v2_flash.MiMoV2Model", "vllm.model_executor.models.mimo_v2_flash.logger" ], "n_typable": 137, "n_typed": 71, "n_any": 0, "n_untyped": 66, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 23, "n_method_overloads": 23, "n_method_params": 53, "n_classes": 6, "n_attrs": 61, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/minicpm.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.minicpm.MiniCPMForCausalLM", "methods": [ { "kind": "function", "name": "MiniCPMForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniCPMForCausalLM._init_model", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniCPMForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniCPMForCausalLM.set_aux_hidden_state_layers", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniCPMForCausalLM.get_eagle3_aux_hidden_state_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MiniCPMForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MiniCPMForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniCPMForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniCPMForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MiniCPMForCausalLM.embedding_modules", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MiniCPMForCausalLM.prefix", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMForCausalLM.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMForCausalLM.cache_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMForCausalLM.scale_width", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 30, "n_typed": 18, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 12, "n_attrs": 12, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minicpm.MiniCPMDecoderLayer", "methods": [ { "kind": "function", "name": "MiniCPMDecoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MiniCPMDecoderLayer._init_attn_block", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MiniCPMDecoderLayer._init_ffn_block", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MiniCPMDecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniCPMDecoderLayer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMDecoderLayer.cache_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMDecoderLayer.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMDecoderLayer.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMDecoderLayer.prefix", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 9, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 7, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minicpm.MiniCPMMoE", "methods": [ { "kind": "function", "name": "MiniCPMMoE.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "MiniCPMMoE.weight_loader", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MiniCPMMoE.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniCPMMoE.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMMoE.num_total_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMMoE.top_k", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMMoE.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMMoE.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMMoE.params_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMMoE.gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMMoE.ws", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMMoE.w2s", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 24, "n_typed": 13, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 12, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minicpm.MiniCPMAttention", "methods": [ { "kind": "function", "name": "MiniCPMAttention.__init__", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "MiniCPMAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniCPMAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMAttention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 26, "n_typed": 12, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 10, "n_attrs": 14, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minicpm.MiniCPMModel", "methods": [ { "kind": "function", "name": "MiniCPMModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniCPMModel._init_layers", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MiniCPMModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniCPMModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MiniCPMModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniCPMModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMModel.cache_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMModel.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMModel.num_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMModel.aux_hidden_state_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 26, "n_typed": 15, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 12, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minicpm.MiniCPMMLP", "methods": [ { "kind": "function", "name": "MiniCPMMLP.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "MiniCPMMLP.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniCPMMLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.minicpm", "names": [ "vllm.model_executor.models.minicpm.MiniCPMAttention", "vllm.model_executor.models.minicpm.MiniCPMDecoderLayer", "vllm.model_executor.models.minicpm.MiniCPMForCausalLM", "vllm.model_executor.models.minicpm.MiniCPMMLP", "vllm.model_executor.models.minicpm.MiniCPMMoE", "vllm.model_executor.models.minicpm.MiniCPMModel" ], "n_typable": 135, "n_typed": 74, "n_any": 0, "n_untyped": 61, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 24, "n_method_overloads": 24, "n_method_params": 60, "n_classes": 6, "n_attrs": 53, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/minicpm3.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.minicpm3.MiniCPM3Model", "methods": [ { "kind": "function", "name": "MiniCPM3Model._init_layers", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [], "n_typable": 5, "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minicpm3.MiniCPM3Attention", "methods": [ { "kind": "function", "name": "MiniCPM3Attention.__init__", "n_typed": 13, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 }, { "kind": "function", "name": "MiniCPM3Attention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniCPM3Attention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPM3Attention.qk_nope_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPM3Attention.qk_rope_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPM3Attention.qk_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPM3Attention.v_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPM3Attention.q_lora_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPM3Attention.kv_lora_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPM3Attention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPM3Attention.num_local_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPM3Attention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPM3Attention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPM3Attention.q_a_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPM3Attention.q_a_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPM3Attention.q_b_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPM3Attention.kv_a_proj_with_mqa", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPM3Attention.kv_a_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPM3Attention.kv_b_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPM3Attention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPM3Attention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPM3Attention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 36, "n_typed": 16, "n_any": 0, "n_untyped": 20, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 14, "n_attrs": 20, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minicpm3.MiniCPM3ForCausalLM", "methods": [ { "kind": "function", "name": "MiniCPM3ForCausalLM._init_model", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniCPM3ForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minicpm3.MiniCPM3DecoderLayer", "methods": [ { "kind": "function", "name": "MiniCPM3DecoderLayer._init_attn_block", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.minicpm3", "names": [ "vllm.model_executor.models.minicpm3.MiniCPM3Attention", "vllm.model_executor.models.minicpm3.MiniCPM3DecoderLayer", "vllm.model_executor.models.minicpm3.MiniCPM3ForCausalLM", "vllm.model_executor.models.minicpm3.MiniCPM3Model" ], "n_typable": 45, "n_typed": 22, "n_any": 0, "n_untyped": 23, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 20, "n_classes": 4, "n_attrs": 21, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/minicpm_eagle.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.minicpm_eagle.EagleMiniCPMDecoderLayer", "methods": [ { "kind": "function", "name": "EagleMiniCPMDecoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "EagleMiniCPMDecoderLayer._init_attn_block", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EagleMiniCPMDecoderLayer._init_ffn_block", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EagleMiniCPMDecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EagleMiniCPMDecoderLayer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleMiniCPMDecoderLayer.cache_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleMiniCPMDecoderLayer.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleMiniCPMDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleMiniCPMDecoderLayer.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleMiniCPMDecoderLayer.prefix", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 9, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 7, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minicpm_eagle.EagleMiniCPMForCausalLM", "methods": [ { "kind": "function", "name": "EagleMiniCPMForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EagleMiniCPMForCausalLM._init_model", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "EagleMiniCPMForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EagleMiniCPMForCausalLM.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "EagleMiniCPMForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EagleMiniCPMForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EagleMiniCPMForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EagleMiniCPMForCausalLM.embedding_modules", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EagleMiniCPMForCausalLM.prefix", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleMiniCPMForCausalLM.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleMiniCPMForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleMiniCPMForCausalLM.cache_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleMiniCPMForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleMiniCPMForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleMiniCPMForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleMiniCPMForCausalLM.scale_width", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleMiniCPMForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleMiniCPMForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 27, "n_typed": 15, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 11, "n_attrs": 12, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minicpm_eagle.EagleMiniCPMModel", "methods": [ { "kind": "function", "name": "EagleMiniCPMModel.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "EagleMiniCPMModel._init_layers", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "EagleMiniCPMModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EagleMiniCPMModel.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "EagleMiniCPMModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EagleMiniCPMModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleMiniCPMModel.cache_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleMiniCPMModel.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleMiniCPMModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleMiniCPMModel.fc", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleMiniCPMModel.input_norm1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleMiniCPMModel.input_norm2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleMiniCPMModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleMiniCPMModel.num_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleMiniCPMModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleMiniCPMModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 29, "n_typed": 16, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 13, "n_attrs": 11, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.minicpm_eagle", "names": [ "vllm.model_executor.models.minicpm_eagle.EagleMiniCPMDecoderLayer", "vllm.model_executor.models.minicpm_eagle.EagleMiniCPMForCausalLM", "vllm.model_executor.models.minicpm_eagle.EagleMiniCPMModel" ], "n_typable": 73, "n_typed": 40, "n_any": 0, "n_untyped": 33, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 31, "n_classes": 3, "n_attrs": 29, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/minicpmo.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.minicpmo.MiniCPMOProcessingInfo", "methods": [ { "kind": "function", "name": "MiniCPMOProcessingInfo.get_data_parser", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MiniCPMOProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MiniCPMOProcessingInfo.get_audio_placeholder", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MiniCPMOProcessingInfo.get_default_audio_pool_step", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MiniCPMOProcessingInfo.get_default_audio_sampling_rate", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MiniCPMOProcessingInfo.get_chunk_length", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MiniCPMOProcessingInfo.get_max_audio_tokens_per_chunk", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MiniCPMOProcessingInfo.get_max_audio_chunks_with_most_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MiniCPMOProcessingInfo.get_max_audio_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MiniCPMOProcessingInfo.get_audio_len_by_num_chunks", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniCPMOProcessingInfo.get_num_frames_with_most_features", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniCPMOProcessingInfo.audio_pattern", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 17, "n_typed": 16, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 6, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minicpmo.MiniCPMOBaseModel", "methods": [ { "kind": "function", "name": "MiniCPMOBaseModel.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniCPMOBaseModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniCPMOBaseModel.init_audio_module", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniCPMOBaseModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniCPMOBaseModel.subsequent_chunk_mask", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MiniCPMOBaseModel._get_feat_extract_output_lengths", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniCPMOBaseModel.get_audio_hidden_states", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniCPMOBaseModel._parse_and_validate_audio_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniCPMOBaseModel._parse_and_validate_multimodal_inputs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniCPMOBaseModel._process_audio_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniCPMOBaseModel._process_multimodal_inputs", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniCPMOBaseModel.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MiniCPMOBaseModel.apm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 30, "n_typed": 25, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 18, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minicpmo.MiniCPMOAudioEmbeddingItems", "methods": [ { "kind": "function", "name": "MiniCPMOAudioEmbeddingItems.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minicpmo.MiniCPMODummyInputsBuilder", "methods": [ { "kind": "function", "name": "MiniCPMODummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniCPMODummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minicpmo.MiniCPMOAudioFeatureInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniCPMOAudioFeatureInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMOAudioFeatureInputs.audio_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMOAudioFeatureInputs.audio_feature_lens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.minicpmo.MiniCPMOAudioInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.minicpmo.MiniCPMOMultiModalProcessor", "methods": [ { "kind": "function", "name": "MiniCPMOMultiModalProcessor.get_audio_prompt_texts", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MiniCPMOMultiModalProcessor.process_audios", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MiniCPMOMultiModalProcessor.process_mm_inputs", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MiniCPMOMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MiniCPMOMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 19, "n_typed": 19, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 14, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minicpmo.MiniCPMOMultiModalDataParser", "methods": [ { "kind": "function", "name": "MiniCPMOMultiModalDataParser._parse_audio_data", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minicpmo.MiniCPMWhisperEncoderLayer", "methods": [ { "kind": "function", "name": "MiniCPMWhisperEncoderLayer.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniCPMWhisperEncoderLayer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniCPMWhisperEncoderLayer.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMWhisperEncoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMWhisperEncoderLayer.self_attn_layer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMWhisperEncoderLayer.dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMWhisperEncoderLayer.activation_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMWhisperEncoderLayer.activation_dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMWhisperEncoderLayer.fc1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMWhisperEncoderLayer.fc2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMWhisperEncoderLayer.final_layer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 5, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minicpmo.MultiModalProjector", "methods": [ { "kind": "function", "name": "MultiModalProjector.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MultiModalProjector.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MultiModalProjector.linear1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiModalProjector.relu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiModalProjector.linear2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 4, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minicpmo.MiniCPMOAudioEmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniCPMOAudioEmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMOAudioEmbeddingInputs.audio_embeds", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minicpmo.MiniCPMO4_5", "methods": [ { "kind": "function", "name": "MiniCPMO4_5.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniCPMO4_5.apm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 4, "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minicpmo.MiniCPMWhisperEncoder", "methods": [ { "kind": "function", "name": "MiniCPMWhisperEncoder.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniCPMWhisperEncoder.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniCPMWhisperEncoder.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 6, "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.minicpmo.CPU_DEVICE", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.models.minicpmo.FLAG_GEMS_CONFIG", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minicpmo.MiniCPMO2_6", "methods": [ { "kind": "function", "name": "MiniCPMO2_6.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniCPMO2_6.apm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 4, "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minicpmo.MiniCPMO", "methods": [ { "kind": "function", "name": "MiniCPMO.__new__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniCPMO.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.minicpmo", "names": [ "vllm.model_executor.models.minicpmo.CPU_DEVICE", "vllm.model_executor.models.minicpmo.FLAG_GEMS_CONFIG", "vllm.model_executor.models.minicpmo.MiniCPMO", "vllm.model_executor.models.minicpmo.MiniCPMO2_6", "vllm.model_executor.models.minicpmo.MiniCPMO4_5", "vllm.model_executor.models.minicpmo.MiniCPMOAudioEmbeddingInputs", "vllm.model_executor.models.minicpmo.MiniCPMOAudioEmbeddingItems", "vllm.model_executor.models.minicpmo.MiniCPMOAudioFeatureInputs", "vllm.model_executor.models.minicpmo.MiniCPMOAudioInputs", "vllm.model_executor.models.minicpmo.MiniCPMOBaseModel", "vllm.model_executor.models.minicpmo.MiniCPMODummyInputsBuilder", "vllm.model_executor.models.minicpmo.MiniCPMOMultiModalDataParser", "vllm.model_executor.models.minicpmo.MiniCPMOMultiModalProcessor", "vllm.model_executor.models.minicpmo.MiniCPMOProcessingInfo", "vllm.model_executor.models.minicpmo.MiniCPMWhisperEncoder", "vllm.model_executor.models.minicpmo.MiniCPMWhisperEncoderLayer", "vllm.model_executor.models.minicpmo.MultiModalProjector" ], "n_typable": 127, "n_typed": 98, "n_any": 0, "n_untyped": 29, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 41, "n_method_overloads": 41, "n_method_params": 63, "n_classes": 14, "n_attrs": 26, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/minicpmv.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.minicpmv.MiniCPMVImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniCPMVImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMVImagePixelInputs.pixel_values", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMVImagePixelInputs.tgt_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMVImagePixelInputs.num_slices", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minicpmv.MiniCPMV2_0", "methods": [ { "kind": "function", "name": "MiniCPMV2_0.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniCPMV2_0.init_llm", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniCPMV2_0.init_vision_module", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MiniCPMV2_0.init_resampler", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MiniCPMV2_0.get_vision_hidden_states", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniCPMV2_0.supports_encoder_tp_data", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 17, "n_typed": 16, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 12, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minicpmv.MiniCPMVProcessingInfo", "methods": [ { "kind": "function", "name": "MiniCPMVProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MiniCPMVProcessingInfo.get_hf_processor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniCPMVProcessingInfo.get_image_processor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniCPMVProcessingInfo.get_data_parser", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MiniCPMVProcessingInfo.get_model_version", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MiniCPMVProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MiniCPMVProcessingInfo.get_slice_image_placeholder", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MiniCPMVProcessingInfo.get_sliced_grid", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniCPMVProcessingInfo.get_num_image_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniCPMVProcessingInfo.get_max_image_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MiniCPMVProcessingInfo.get_image_max_slice_num", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MiniCPMVProcessingInfo.get_image_size_with_most_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MiniCPMVProcessingInfo.get_max_video_frame_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MiniCPMVProcessingInfo.get_max_video_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniCPMVProcessingInfo.get_video_max_slice_num", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MiniCPMVProcessingInfo.get_video_frame_size_with_most_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MiniCPMVProcessingInfo.get_max_video_frames", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniCPMVProcessingInfo.get_num_frames_with_most_features", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniCPMVProcessingInfo.image_pattern", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MiniCPMVProcessingInfo.video_pattern", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 33, "n_typed": 28, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 18, "n_method_overloads": 18, "n_method_params": 15, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minicpmv.MiniCPMVBaseModel", "methods": [ { "kind": "function", "name": "MiniCPMVBaseModel.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniCPMVBaseModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniCPMVBaseModel._parse_and_validate_vision_input", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniCPMVBaseModel._parse_and_validate_multimodal_inputs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniCPMVBaseModel._process_vision_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniCPMVBaseModel._process_multimodal_inputs", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniCPMVBaseModel.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniCPMVBaseModel.forward", "n_typed": 5, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MiniCPMVBaseModel.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniCPMVBaseModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniCPMVBaseModel.get_mm_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MiniCPMVBaseModel.init_llm", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniCPMVBaseModel.init_vision_module", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MiniCPMVBaseModel.init_resampler", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MiniCPMVBaseModel.get_vision_hidden_states", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniCPMVBaseModel.supports_encoder_tp_data", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MiniCPMVBaseModel.use_data_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMVBaseModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMVBaseModel.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMVBaseModel.version", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMVBaseModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMVBaseModel.llm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMVBaseModel.vpm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMVBaseModel.vision_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMVBaseModel.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMVBaseModel.resampler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 52, "n_typed": 39, "n_any": 1, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 27, "n_attrs": 11, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minicpmv.MiniCPMVDummyInputsBuilder", "methods": [ { "kind": "function", "name": "MiniCPMVDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniCPMVDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.minicpmv.MiniCPMVImageInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.minicpmv.MiniCPMV4_0", "methods": [ { "kind": "function", "name": "MiniCPMV4_0.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniCPMV4_0.init_llm", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniCPMV4_0.init_vision_module", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MiniCPMV4_0.init_resampler", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MiniCPMV4_0.get_vision_hidden_states", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniCPMV4_0.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniCPMV4_0.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 19, "n_typed": 18, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 13, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.minicpmv.get_version_by_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.model_executor.models.minicpmv.MiniCPMV", "methods": [ { "kind": "function", "name": "MiniCPMV.__new__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minicpmv.MiniCPMV2_6", "methods": [ { "kind": "function", "name": "MiniCPMV2_6.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniCPMV2_6.init_llm", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniCPMV2_6.init_vision_module", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MiniCPMV2_6.init_resampler", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MiniCPMV2_6.get_vision_hidden_states", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniCPMV2_6.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniCPMV2_6.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 19, "n_typed": 18, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 13, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minicpmv.MiniCPMVImageEmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniCPMVImageEmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MiniCPMVImageEmbeddingInputs.image_embeds", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minicpmv.MiniCPMV2_5", "methods": [ { "kind": "function", "name": "MiniCPMV2_5.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniCPMV2_5.init_llm", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniCPMV2_5.init_vision_module", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MiniCPMV2_5.init_resampler", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MiniCPMV2_5.get_vision_hidden_states", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniCPMV2_5.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 17, "n_typed": 16, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 12, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minicpmv.Resampler4_5", "methods": [ { "kind": "function", "name": "Resampler4_5.__init__", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "Resampler4_5.get_1d_sincos_pos_embed_from_temporal_size", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Resampler4_5._set_temporal_pos_cache", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Resampler4_5._adjust_temporal_pos_cache", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Resampler4_5._init_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Resampler4_5.forward", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Resampler4_5.max_temporal_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 26, "n_typed": 21, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 19, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minicpmv.MiniCPMVVideoEmbeddingItems", "methods": [ { "kind": "function", "name": "MiniCPMVVideoEmbeddingItems.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniCPMVVideoEmbeddingItems.get_frame_size", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniCPMVVideoEmbeddingItems.get_num_frames", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minicpmv.Resampler2_5", "methods": [ { "kind": "function", "name": "Resampler2_5.__init__", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "Resampler2_5._set_2d_pos_cache", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Resampler2_5._adjust_pos_cache", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Resampler2_5.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Resampler2_5.max_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 18, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 14, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minicpmv.MiniCPMVImageEmbeddingItems", "methods": [ { "kind": "function", "name": "MiniCPMVImageEmbeddingItems.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniCPMVImageEmbeddingItems.get_image_size", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minicpmv.MiniCPMVMultiModalDataParser", "methods": [ { "kind": "function", "name": "MiniCPMVMultiModalDataParser._parse_image_data", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniCPMVMultiModalDataParser._parse_video_data", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minicpmv.MiniCPMVMultiModalProcessor", "methods": [ { "kind": "function", "name": "MiniCPMVMultiModalProcessor.get_image_prompt_texts", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniCPMVMultiModalProcessor.get_video_prompt_texts", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniCPMVMultiModalProcessor.process_images", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MiniCPMVMultiModalProcessor.process_videos", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MiniCPMVMultiModalProcessor.process_mm_inputs", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MiniCPMVMultiModalProcessor._base_call_hf_processor", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MiniCPMVMultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MiniCPMVMultiModalProcessor._hf_processor_applies_updates", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MiniCPMVMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MiniCPMVMultiModalProcessor._recompute_cached_prompt_update", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniCPMVMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 44, "n_typed": 44, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 33, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.minicpmv.DEFAULT_LN", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.minicpmv.MiniCPMV4_5", "methods": [ { "kind": "function", "name": "MiniCPMV4_5.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniCPMV4_5.init_llm", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniCPMV4_5.init_vision_module", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MiniCPMV4_5.init_resampler", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MiniCPMV4_5.get_vision_hidden_states", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniCPMV4_5.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniCPMV4_5.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 19, "n_typed": 18, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 13, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.minicpmv", "names": [ "vllm.model_executor.models.minicpmv.DEFAULT_LN", "vllm.model_executor.models.minicpmv.MiniCPMV", "vllm.model_executor.models.minicpmv.MiniCPMV2_0", "vllm.model_executor.models.minicpmv.MiniCPMV2_5", "vllm.model_executor.models.minicpmv.MiniCPMV2_6", "vllm.model_executor.models.minicpmv.MiniCPMV4_0", "vllm.model_executor.models.minicpmv.MiniCPMV4_5", "vllm.model_executor.models.minicpmv.MiniCPMVBaseModel", "vllm.model_executor.models.minicpmv.MiniCPMVDummyInputsBuilder", "vllm.model_executor.models.minicpmv.MiniCPMVImageEmbeddingInputs", "vllm.model_executor.models.minicpmv.MiniCPMVImageEmbeddingItems", "vllm.model_executor.models.minicpmv.MiniCPMVImageInputs", "vllm.model_executor.models.minicpmv.MiniCPMVImagePixelInputs", "vllm.model_executor.models.minicpmv.MiniCPMVMultiModalDataParser", "vllm.model_executor.models.minicpmv.MiniCPMVMultiModalProcessor", "vllm.model_executor.models.minicpmv.MiniCPMVProcessingInfo", "vllm.model_executor.models.minicpmv.MiniCPMVVideoEmbeddingItems", "vllm.model_executor.models.minicpmv.Resampler2_5", "vllm.model_executor.models.minicpmv.Resampler4_5", "vllm.model_executor.models.minicpmv.get_version_by_config" ], "n_typable": 300, "n_typed": 269, "n_any": 1, "n_untyped": 30, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 92, "n_method_overloads": 92, "n_method_params": 186, "n_classes": 17, "n_attrs": 28, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/minimax_m2.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.minimax_m2.MiniMaxM2Model", "methods": [ { "kind": "function", "name": "MiniMaxM2Model.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniMaxM2Model.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniMaxM2Model.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MiniMaxM2Model.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MiniMaxM2Model.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniMaxM2Model.fall_back_to_pt_during_load", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MiniMaxM2Model.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxM2Model.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxM2Model.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxM2Model.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxM2Model.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 12, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 8, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minimax_m2.MiniMaxM2ForCausalLM", "methods": [ { "kind": "function", "name": "MiniMaxM2ForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniMaxM2ForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniMaxM2ForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MiniMaxM2ForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniMaxM2ForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniMaxM2ForCausalLM.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniMaxM2ForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MiniMaxM2ForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxM2ForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxM2ForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxM2ForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxM2ForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxM2ForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 14, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 10, "n_attrs": 7, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.minimax_m2.get_spec_layer_idx_from_weight_name", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.models.minimax_m2.MiniMaxM2MoE", "methods": [ { "kind": "function", "name": "MiniMaxM2MoE.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MiniMaxM2MoE.ebias_weight_loader", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniMaxM2MoE.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniMaxM2MoE.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxM2MoE.use_routing_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxM2MoE.experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxM2MoE.gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxM2MoE.e_score_correction_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 8, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minimax_m2.MiniMaxM2Attention", "methods": [ { "kind": "function", "name": "MiniMaxM2Attention.__init__", "n_typed": 14, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 }, { "kind": "function", "name": "MiniMaxM2Attention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniMaxM2Attention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxM2Attention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxM2Attention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxM2Attention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxM2Attention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxM2Attention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxM2Attention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxM2Attention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxM2Attention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxM2Attention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxM2Attention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxM2Attention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxM2Attention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxM2Attention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxM2Attention.q_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxM2Attention.k_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 33, "n_typed": 17, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 15, "n_attrs": 16, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minimax_m2.MiniMaxM2DecoderLayer", "methods": [ { "kind": "function", "name": "MiniMaxM2DecoderLayer.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MiniMaxM2DecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniMaxM2DecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxM2DecoderLayer.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxM2DecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxM2DecoderLayer.block_sparse_moe", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxM2DecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxM2DecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 10, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.minimax_m2", "names": [ "vllm.model_executor.models.minimax_m2.MiniMaxM2Attention", "vllm.model_executor.models.minimax_m2.MiniMaxM2DecoderLayer", "vllm.model_executor.models.minimax_m2.MiniMaxM2ForCausalLM", "vllm.model_executor.models.minimax_m2.MiniMaxM2MoE", "vllm.model_executor.models.minimax_m2.MiniMaxM2Model", "vllm.model_executor.models.minimax_m2.get_spec_layer_idx_from_weight_name" ], "n_typable": 106, "n_typed": 64, "n_any": 0, "n_untyped": 42, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 18, "n_method_overloads": 18, "n_method_params": 47, "n_classes": 5, "n_attrs": 40, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/minimax_text_01.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.models.minimax_text_01.weight_loader_with_alias", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.model_executor.models.minimax_text_01.MiniMaxText01DecoderLayer", "methods": [ { "kind": "function", "name": "MiniMaxText01DecoderLayer.__init__", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "MiniMaxText01DecoderLayer.forward", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "MiniMaxText01DecoderLayer.shared_moe_coefficient_loader", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniMaxText01DecoderLayer.prefix", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01DecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01DecoderLayer.expert_num", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01DecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01DecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01DecoderLayer.layernorm_mlp_alpha", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01DecoderLayer.layernorm_mlp_beta", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01DecoderLayer.postnorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01DecoderLayer.shared_moe", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01DecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01DecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01DecoderLayer.layernorm_attention_alpha", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01DecoderLayer.layernorm_attention_beta", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01DecoderLayer.shared_mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01DecoderLayer.coefficient", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01DecoderLayer.shared_moe_mode", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01DecoderLayer.block_sparse_moe", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 36, "n_typed": 18, "n_any": 0, "n_untyped": 18, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 16, "n_attrs": 17, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minimax_text_01.MiniMaxText01Attention", "methods": [ { "kind": "function", "name": "MiniMaxText01Attention.__init__", "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "MiniMaxText01Attention.forward", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniMaxText01Attention.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01Attention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01Attention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01Attention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01Attention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01Attention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01Attention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01Attention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01Attention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01Attention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01Attention.sliding_window", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01Attention.prefix", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01Attention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01Attention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01Attention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01Attention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 33, "n_typed": 16, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 15, "n_attrs": 16, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minimax_text_01.MiniMaxText01MLP", "methods": [ { "kind": "function", "name": "MiniMaxText01MLP.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MiniMaxText01MLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniMaxText01MLP.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01MLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01MLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01MLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 8, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minimax_text_01.MiniMaxText01ForCausalLM", "methods": [ { "kind": "function", "name": "MiniMaxText01ForCausalLM.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniMaxText01ForCausalLM.copy_inputs_before_cuda_graphs", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniMaxText01ForCausalLM.get_seqlen_agnostic_capture_inputs", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniMaxText01ForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniMaxText01ForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MiniMaxText01ForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniMaxText01ForCausalLM.make_empty_intermediate_tensors", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MiniMaxText01ForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniMaxText01ForCausalLM.get_mamba_state_dtype_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniMaxText01ForCausalLM.get_mamba_state_shape_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniMaxText01ForCausalLM.get_mamba_state_copy_func", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniMaxText01ForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01ForCausalLM.CONCAT_FFN", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01ForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01ForCausalLM.kv_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01ForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01ForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 35, "n_typed": 24, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 18, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minimax_text_01.MiniMaxText01Model", "methods": [ { "kind": "function", "name": "MiniMaxText01Model.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniMaxText01Model._clear_prefill_cache", "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MiniMaxText01Model.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniMaxText01Model.forward", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniMaxText01Model.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01Model.decoder_attention_types", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01Model.num_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01Model.cache_shape", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01Model.embed_scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01Model.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01Model.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 10, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 11, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minimax_text_01.MiniMaxText01MoE", "methods": [ { "kind": "function", "name": "MiniMaxText01MoE.__init__", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "MiniMaxText01MoE.gate_weight_loader", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniMaxText01MoE.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniMaxText01MoE.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01MoE.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01MoE.num_total_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01MoE.top_k", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01MoE.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01MoE.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01MoE.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01MoE.params_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01MoE.gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxText01MoE.experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 24, "n_typed": 14, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 11, "n_attrs": 10, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.minimax_text_01.replace_weight_name", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "type_ignores": [], "name": "vllm.model_executor.models.minimax_text_01", "names": [ "vllm.model_executor.models.minimax_text_01.MiniMaxText01Attention", "vllm.model_executor.models.minimax_text_01.MiniMaxText01DecoderLayer", "vllm.model_executor.models.minimax_text_01.MiniMaxText01ForCausalLM", "vllm.model_executor.models.minimax_text_01.MiniMaxText01MLP", "vllm.model_executor.models.minimax_text_01.MiniMaxText01MoE", "vllm.model_executor.models.minimax_text_01.MiniMaxText01Model", "vllm.model_executor.models.minimax_text_01.replace_weight_name", "vllm.model_executor.models.minimax_text_01.weight_loader_with_alias" ], "n_typable": 170, "n_typed": 97, "n_any": 0, "n_untyped": 73, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 6, "n_methods": 25, "n_method_overloads": 25, "n_method_params": 77, "n_classes": 6, "n_attrs": 60, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/minimax_vl_01.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.models.minimax_vl_01.MiniMaxVL01ImageInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.minimax_vl_01.MiniMaxVL01MultiModalProjector", "methods": [ { "kind": "function", "name": "MiniMaxVL01MultiModalProjector.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "MiniMaxVL01MultiModalProjector.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniMaxVL01MultiModalProjector.linear_1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxVL01MultiModalProjector.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxVL01MultiModalProjector.linear_2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 8, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minimax_vl_01.MiniMaxVL01DummyInputsBuilder", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minimax_vl_01.MiniMaxVL01ProcessingInfo", "methods": [ { "kind": "function", "name": "MiniMaxVL01ProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MiniMaxVL01ProcessingInfo.get_hf_processor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniMaxVL01ProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minimax_vl_01.MiniMaxVL01ForConditionalGeneration", "methods": [ { "kind": "function", "name": "MiniMaxVL01ForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniMaxVL01ForConditionalGeneration.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniMaxVL01ForConditionalGeneration._image_pixels_to_features", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniMaxVL01ForConditionalGeneration.pack_image_features", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MiniMaxVL01ForConditionalGeneration._process_image_pixels", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniMaxVL01ForConditionalGeneration._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniMaxVL01ForConditionalGeneration._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniMaxVL01ForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniMaxVL01ForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MiniMaxVL01ForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniMaxVL01ForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniMaxVL01ForConditionalGeneration.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MiniMaxVL01ForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxVL01ForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxVL01ForConditionalGeneration.vision_feature_layer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxVL01ForConditionalGeneration.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxVL01ForConditionalGeneration.pad_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxVL01ForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxVL01ForConditionalGeneration.vision_tower", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxVL01ForConditionalGeneration.multi_modal_projector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxVL01ForConditionalGeneration.image_newline", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxVL01ForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 40, "n_typed": 29, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 19, "n_attrs": 11, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minimax_vl_01.MiniMaxVL01ImageEmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniMaxVL01ImageEmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxVL01ImageEmbeddingInputs.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minimax_vl_01.MiniMaxVL01ImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniMaxVL01ImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxVL01ImagePixelInputs.pixel_values", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxVL01ImagePixelInputs.image_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.minimax_vl_01.MiniMaxVL01MultiModalProcessor", "methods": [ { "kind": "function", "name": "MiniMaxVL01MultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MiniMaxVL01MultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 8, "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.minimax_vl_01", "names": [ "vllm.model_executor.models.minimax_vl_01.MiniMaxVL01DummyInputsBuilder", "vllm.model_executor.models.minimax_vl_01.MiniMaxVL01ForConditionalGeneration", "vllm.model_executor.models.minimax_vl_01.MiniMaxVL01ImageEmbeddingInputs", "vllm.model_executor.models.minimax_vl_01.MiniMaxVL01ImageInputs", "vllm.model_executor.models.minimax_vl_01.MiniMaxVL01ImagePixelInputs", "vllm.model_executor.models.minimax_vl_01.MiniMaxVL01MultiModalProcessor", "vllm.model_executor.models.minimax_vl_01.MiniMaxVL01MultiModalProjector", "vllm.model_executor.models.minimax_vl_01.MiniMaxVL01ProcessingInfo" ], "n_typable": 70, "n_typed": 53, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 18, "n_method_overloads": 18, "n_method_params": 33, "n_classes": 7, "n_attrs": 20, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/mistral.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.mistral.MistralDecoderLayer", "methods": [ { "kind": "function", "name": "MistralDecoderLayer.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MistralDecoderLayer.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MistralDecoderLayer.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MistralDecoderLayer.ada_rms_norm_t_cond", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 9, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mistral.MistralModel", "methods": [ { "kind": "function", "name": "MistralModel.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MistralModel.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [], "n_typable": 10, "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mistral.MistralAttention", "methods": [ { "kind": "function", "name": "MistralAttention.__init__", "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "MistralAttention._get_llama_4_attn_scale", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MistralAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MistralAttention.do_llama_4_scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MistralAttention.llama_4_scaling_original_max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MistralAttention.llama_4_scaling_beta", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 17, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 14, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mistral.MistralMLP", "methods": [ { "kind": "function", "name": "MistralMLP.__init__", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "MistralMLP.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MistralMLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MistralMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MistralMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 10, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 10, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mistral.MistralForCausalLM", "methods": [ { "kind": "function", "name": "MistralForCausalLM.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MistralForCausalLM._init_model", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MistralForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MistralForCausalLM.maybe_remap_mistral", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MistralForCausalLM.embedding_modules", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MistralForCausalLM.mistral_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 14, "n_typed": 12, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 9, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.mistral", "names": [ "vllm.model_executor.models.mistral.MistralAttention", "vllm.model_executor.models.mistral.MistralDecoderLayer", "vllm.model_executor.models.mistral.MistralForCausalLM", "vllm.model_executor.models.mistral.MistralMLP", "vllm.model_executor.models.mistral.MistralModel" ], "n_typable": 70, "n_typed": 57, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 48, "n_classes": 5, "n_attrs": 10, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/mistral3.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.mistral3.LlavaLikeProcessor", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mistral3.Mistral3ForConditionalGeneration", "methods": [ { "kind": "function", "name": "Mistral3ForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Mistral3ForConditionalGeneration.set_aux_hidden_state_layers", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Mistral3ForConditionalGeneration.get_eagle3_aux_hidden_state_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Mistral3ForConditionalGeneration.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Mistral3ForConditionalGeneration._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Mistral3ForConditionalGeneration._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Mistral3ForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Mistral3ForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Mistral3ForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Mistral3ForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Mistral3ForConditionalGeneration.get_mm_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Mistral3ForConditionalGeneration.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Mistral3ForConditionalGeneration.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Mistral3ForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Mistral3ForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Mistral3ForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Mistral3ForConditionalGeneration.vision_tower", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Mistral3ForConditionalGeneration.multi_modal_projector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Mistral3ForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 33, "n_typed": 26, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 15, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mistral3.Mistral3ImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Mistral3ImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Mistral3ImagePixelInputs.pixel_values", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mistral3.Mistral3MultiModalProjector", "methods": [ { "kind": "function", "name": "Mistral3MultiModalProjector.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "Mistral3MultiModalProjector.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Mistral3MultiModalProjector.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Mistral3MultiModalProjector.patch_merger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Mistral3MultiModalProjector.linear_1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Mistral3MultiModalProjector.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Mistral3MultiModalProjector.linear_2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 11, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 10, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mistral3.Mistral3MultiModalProcessor", "methods": [ { "kind": "function", "name": "Mistral3MultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Mistral3MultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Mistral3MultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mistral3.BaseLlavaProcessingInfo", "methods": [ { "kind": "function", "name": "BaseLlavaProcessingInfo.get_hf_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BaseLlavaProcessingInfo.get_vision_encoder_info", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BaseLlavaProcessingInfo.get_hf_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseLlavaProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BaseLlavaProcessingInfo.get_num_image_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseLlavaProcessingInfo.get_image_size_with_most_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.mistral3.init_vision_tower_for_llava", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.model_executor.models.mistral3.Mistral3ProcessingInfo", "methods": [ { "kind": "function", "name": "Mistral3ProcessingInfo.get_hf_processor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mistral3.Mistral3DummyInputsBuilder", "methods": [ { "kind": "function", "name": "Mistral3DummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Mistral3DummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mistral3.LlavaLikeConfig", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mistral3.Mistral3PatchMerger", "methods": [ { "kind": "function", "name": "Mistral3PatchMerger.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Mistral3PatchMerger.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Mistral3PatchMerger.vision_hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Mistral3PatchMerger.spatial_merge_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Mistral3PatchMerger.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Mistral3PatchMerger.merging_layer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 6, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 4, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.mistral3", "names": [ "vllm.model_executor.models.mistral3.BaseLlavaProcessingInfo", "vllm.model_executor.models.mistral3.LlavaLikeConfig", "vllm.model_executor.models.mistral3.LlavaLikeProcessor", "vllm.model_executor.models.mistral3.Mistral3DummyInputsBuilder", "vllm.model_executor.models.mistral3.Mistral3ForConditionalGeneration", "vllm.model_executor.models.mistral3.Mistral3ImagePixelInputs", "vllm.model_executor.models.mistral3.Mistral3MultiModalProcessor", "vllm.model_executor.models.mistral3.Mistral3MultiModalProjector", "vllm.model_executor.models.mistral3.Mistral3PatchMerger", "vllm.model_executor.models.mistral3.Mistral3ProcessingInfo", "vllm.model_executor.models.mistral3.init_vision_tower_for_llava" ], "n_typable": 97, "n_typed": 77, "n_any": 0, "n_untyped": 20, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 4, "n_methods": 27, "n_method_overloads": 27, "n_method_params": 47, "n_classes": 10, "n_attrs": 19, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/mistral_large_3.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.mistral_large_3.MistralLarge3ForCausalLM", "methods": [ { "kind": "function", "name": "MistralLarge3ForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MistralLarge3ForCausalLM._remap_mistral_to_ds", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MistralLarge3ForCausalLM.remapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.mistral_large_3", "names": [ "vllm.model_executor.models.mistral_large_3.MistralLarge3ForCausalLM" ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/mistral_large_3_eagle.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.mistral_large_3_eagle.EagleMistralLarge3ForCausalLM", "methods": [ { "kind": "function", "name": "EagleMistralLarge3ForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EagleMistralLarge3ForCausalLM.get_language_model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EagleMistralLarge3ForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "EagleMistralLarge3ForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EagleMistralLarge3ForCausalLM.remapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EagleMistralLarge3ForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleMistralLarge3ForCausalLM.model_cls", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleMistralLarge3ForCausalLM.embed_input_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 13, "n_typed": 10, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 7, "n_attrs": 4, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.mistral_large_3_eagle.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.mistral_large_3_eagle.EagleMistralLarge3Model", "methods": [ { "kind": "function", "name": "EagleMistralLarge3Model.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "EagleMistralLarge3Model.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EagleMistralLarge3Model.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleMistralLarge3Model.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleMistralLarge3Model.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleMistralLarge3Model.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleMistralLarge3Model.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleMistralLarge3Model.start_layer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleMistralLarge3Model.end_layer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleMistralLarge3Model.fc", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleMistralLarge3Model.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleMistralLarge3Model.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 8, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 10, "n_properties": 0 } ], "type_ignores": [ { "kind": "type", "rules": null } ], "name": "vllm.model_executor.models.mistral_large_3_eagle", "names": [ "vllm.model_executor.models.mistral_large_3_eagle.EagleMistralLarge3ForCausalLM", "vllm.model_executor.models.mistral_large_3_eagle.EagleMistralLarge3Model", "vllm.model_executor.models.mistral_large_3_eagle.logger" ], "n_typable": 33, "n_typed": 18, "n_any": 0, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 14, "n_classes": 2, "n_attrs": 15, "n_properties": 0, "n_type_ignores": 1 }, { "path": "vllm/model_executor/models/mixtral.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.mixtral.MixtralAttention", "methods": [ { "kind": "function", "name": "MixtralAttention.__init__", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "MixtralAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MixtralAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 25, "n_typed": 12, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 10, "n_attrs": 13, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mixtral.MixtralModel", "methods": [ { "kind": "function", "name": "MixtralModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MixtralModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MixtralModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MixtralModel.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MixtralModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MixtralModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralModel.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralModel.org_vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralModel.enable_eplb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralModel.num_redundant_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 12, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 8, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mixtral.MixtralForCausalLM", "methods": [ { "kind": "function", "name": "MixtralForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MixtralForCausalLM.update_physical_experts_metadata", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MixtralForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MixtralForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MixtralForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MixtralForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MixtralForCausalLM.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MixtralForCausalLM.fall_back_to_pt_during_load", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MixtralForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MixtralForCausalLM.embedding_modules", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MixtralForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralForCausalLM.expert_weights", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralForCausalLM.moe_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralForCausalLM.num_moe_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralForCausalLM.num_logical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralForCausalLM.num_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralForCausalLM.num_local_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralForCausalLM.num_routed_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralForCausalLM.num_redundant_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralForCausalLM.num_expert_groups", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralForCausalLM.num_shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 34, "n_typed": 17, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 11, "n_attrs": 19, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mixtral.MixtralDecoderLayer", "methods": [ { "kind": "function", "name": "MixtralDecoderLayer.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MixtralDecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MixtralDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralDecoderLayer.block_sparse_moe", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 10, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mixtral.MixtralMoE", "methods": [ { "kind": "function", "name": "MixtralMoE.__init__", "n_typed": 10, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "MixtralMoE.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MixtralMoE.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralMoE.ep_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralMoE.ep_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralMoE.ep_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralMoE.enable_eplb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralMoE.n_routed_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralMoE.n_logical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralMoE.n_redundant_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralMoE.n_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralMoE.n_local_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralMoE.physical_expert_start", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralMoE.physical_expert_end", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralMoE.gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MixtralMoE.experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 27, "n_typed": 12, "n_any": 0, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 11, "n_attrs": 14, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.mixtral", "names": [ "vllm.model_executor.models.mixtral.MixtralAttention", "vllm.model_executor.models.mixtral.MixtralDecoderLayer", "vllm.model_executor.models.mixtral.MixtralForCausalLM", "vllm.model_executor.models.mixtral.MixtralMoE", "vllm.model_executor.models.mixtral.MixtralModel" ], "n_typable": 123, "n_typed": 63, "n_any": 0, "n_untyped": 60, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 18, "n_method_overloads": 18, "n_method_params": 48, "n_classes": 5, "n_attrs": 60, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/mllama4.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.mllama4.Llama4VisionMLP", "methods": [ { "kind": "function", "name": "Llama4VisionMLP.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "Llama4VisionMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Llama4VisionMLP.fc1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4VisionMLP.fc2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4VisionMLP.activation_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4VisionMLP.output_activation", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 9, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mllama4.Llama4VisionEncoderLayer", "methods": [ { "kind": "function", "name": "Llama4VisionEncoderLayer.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Llama4VisionEncoderLayer.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Llama4VisionEncoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4VisionEncoderLayer.num_attention_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4VisionEncoderLayer.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4VisionEncoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4VisionEncoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4VisionEncoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4VisionEncoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 4, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mllama4.Llama4MultiModalProjector", "methods": [ { "kind": "function", "name": "Llama4MultiModalProjector.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Llama4MultiModalProjector.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Llama4MultiModalProjector.linear_1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 2, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mllama4.Llama4ImagePatchInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Llama4ImagePatchInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Llama4ImagePatchInputs.pixel_values", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Llama4ImagePatchInputs.patches_per_image", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Llama4ImagePatchInputs.aspect_ratios", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mllama4.Llama4VisionPixelShuffleMLP", "methods": [ { "kind": "function", "name": "Llama4VisionPixelShuffleMLP.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Llama4VisionPixelShuffleMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Llama4VisionPixelShuffleMLP.pixel_shuffle_ratio", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4VisionPixelShuffleMLP.inner_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4VisionPixelShuffleMLP.output_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4VisionPixelShuffleMLP.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 4, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mllama4.Mllama4MultiModalProcessor", "methods": [ { "kind": "function", "name": "Mllama4MultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Mllama4MultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Mllama4MultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mllama4.Llama4UnfoldConvolution", "methods": [ { "kind": "function", "name": "Llama4UnfoldConvolution.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Llama4UnfoldConvolution.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Llama4UnfoldConvolution.unfold", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4UnfoldConvolution.linear", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 5, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mllama4.Llama4VisionAttention", "methods": [ { "kind": "function", "name": "Llama4VisionAttention.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Llama4VisionAttention.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Llama4VisionAttention.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4VisionAttention.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4VisionAttention.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4VisionAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4VisionAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4VisionAttention.num_local_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4VisionAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4VisionAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4VisionAttention.attention_dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4VisionAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4VisionAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4VisionAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4VisionAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4VisionAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 5, "n_any": 0, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 14, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mllama4.Llama4VisionEncoder", "methods": [ { "kind": "function", "name": "Llama4VisionEncoder.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Llama4VisionEncoder.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Llama4VisionEncoder.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4VisionEncoder.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 5, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mllama4.Mllama4ProcessingInfo", "methods": [ { "kind": "function", "name": "Mllama4ProcessingInfo.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Mllama4ProcessingInfo.get_hf_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Mllama4ProcessingInfo.get_hf_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Mllama4ProcessingInfo.get_default_tok_params", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Mllama4ProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Mllama4ProcessingInfo.get_patch_per_chunk", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Mllama4ProcessingInfo.get_max_num_tiles", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Mllama4ProcessingInfo.get_image_size_with_most_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 11, "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mllama4.Llama4VisionModel", "methods": [ { "kind": "function", "name": "Llama4VisionModel.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Llama4VisionModel.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Llama4VisionModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4VisionModel.image_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4VisionModel.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4VisionModel.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4VisionModel.num_channels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4VisionModel.num_patches", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4VisionModel.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4VisionModel.patch_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4VisionModel.class_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4VisionModel.positional_embedding_vlm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4VisionModel.layernorm_pre", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4VisionModel.layernorm_post", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4VisionModel.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4VisionModel.vision_adapter", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 5, "n_any": 0, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 14, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mllama4.Llama4ForConditionalGeneration", "methods": [ { "kind": "function", "name": "Llama4ForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Llama4ForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Llama4ForConditionalGeneration.set_aux_hidden_state_layers", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Llama4ForConditionalGeneration.get_eagle3_aux_hidden_state_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Llama4ForConditionalGeneration.set_eplb_state", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Llama4ForConditionalGeneration.update_physical_experts_metadata", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Llama4ForConditionalGeneration._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Llama4ForConditionalGeneration._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Llama4ForConditionalGeneration.embed_multimodal", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Llama4ForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Llama4ForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Llama4ForConditionalGeneration.separate_weights", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Llama4ForConditionalGeneration._consolidate_qkv_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Llama4ForConditionalGeneration._rename_weight_for_modelopt_checkpoint", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Llama4ForConditionalGeneration._separate_and_rename_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Llama4ForConditionalGeneration._handle_expert_scale_broadcasting", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Llama4ForConditionalGeneration._load_other_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Llama4ForConditionalGeneration.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Llama4ForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Llama4ForConditionalGeneration.get_mm_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Llama4ForConditionalGeneration.get_num_mm_encoder_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Llama4ForConditionalGeneration.get_num_mm_connector_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Llama4ForConditionalGeneration.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Llama4ForConditionalGeneration.supports_encoder_tp_data", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Llama4ForConditionalGeneration.use_data_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4ForConditionalGeneration.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4ForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4ForConditionalGeneration.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4ForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4ForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4ForConditionalGeneration.num_expert_groups", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4ForConditionalGeneration.num_logical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4ForConditionalGeneration.num_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4ForConditionalGeneration.num_local_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4ForConditionalGeneration.num_routed_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4ForConditionalGeneration.num_shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4ForConditionalGeneration.num_redundant_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4ForConditionalGeneration.moe_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4ForConditionalGeneration.num_moe_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4ForConditionalGeneration.multi_modal_projector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4ForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama4ForConditionalGeneration.vision_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 72, "n_typed": 50, "n_any": 0, "n_untyped": 22, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 22, "n_method_overloads": 22, "n_method_params": 32, "n_attrs": 20, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.mllama4.pixel_shuffle", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.models.mllama4.Mllama4DummyInputsBuilder", "methods": [ { "kind": "function", "name": "Mllama4DummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Mllama4DummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.mllama4", "names": [ "vllm.model_executor.models.mllama4.Llama4ForConditionalGeneration", "vllm.model_executor.models.mllama4.Llama4ImagePatchInputs", "vllm.model_executor.models.mllama4.Llama4MultiModalProjector", "vllm.model_executor.models.mllama4.Llama4UnfoldConvolution", "vllm.model_executor.models.mllama4.Llama4VisionAttention", "vllm.model_executor.models.mllama4.Llama4VisionEncoder", "vllm.model_executor.models.mllama4.Llama4VisionEncoderLayer", "vllm.model_executor.models.mllama4.Llama4VisionMLP", "vllm.model_executor.models.mllama4.Llama4VisionModel", "vllm.model_executor.models.mllama4.Llama4VisionPixelShuffleMLP", "vllm.model_executor.models.mllama4.Mllama4DummyInputsBuilder", "vllm.model_executor.models.mllama4.Mllama4MultiModalProcessor", "vllm.model_executor.models.mllama4.Mllama4ProcessingInfo", "vllm.model_executor.models.mllama4.pixel_shuffle" ], "n_typable": 208, "n_typed": 122, "n_any": 0, "n_untyped": 86, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 51, "n_method_overloads": 51, "n_method_params": 84, "n_classes": 13, "n_attrs": 72, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/mlp_speculator.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.models.mlp_speculator.SQRT2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mlp_speculator.MLPSpeculatorLayerNorm", "methods": [ { "kind": "function", "name": "MLPSpeculatorLayerNorm.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MLPSpeculatorLayerNorm.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MLPSpeculatorLayerNorm.elementwise_scale_and_shift", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLPSpeculatorLayerNorm.eps", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLPSpeculatorLayerNorm.weight", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLPSpeculatorLayerNorm.bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 0, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mlp_speculator.MLPSpeculator", "methods": [ { "kind": "function", "name": "MLPSpeculator.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MLPSpeculator.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MLPSpeculator.n_predict", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLPSpeculator.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLPSpeculator.emb_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLPSpeculator.inner_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLPSpeculator.max_speculative_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLPSpeculator.tie_weights", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLPSpeculator.scale_input", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLPSpeculator.state_weight", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLPSpeculator.emb_weight", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLPSpeculator.activation", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLPSpeculator.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLPSpeculator.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLPSpeculator.emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLPSpeculator.proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLPSpeculator.head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLPSpeculator.ln", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLPSpeculator.ln0", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 5, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 17, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.mlp_speculator", "names": [ "vllm.model_executor.models.mlp_speculator.MLPSpeculator", "vllm.model_executor.models.mlp_speculator.MLPSpeculatorLayerNorm", "vllm.model_executor.models.mlp_speculator.SQRT2" ], "n_typable": 32, "n_typed": 5, "n_any": 0, "n_untyped": 27, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 7, "n_classes": 2, "n_attrs": 22, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/modernbert.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.modernbert.ModernBertForTokenClassification", "methods": [ { "kind": "function", "name": "ModernBertForTokenClassification.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ModernBertForTokenClassification.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModernBertForTokenClassification.load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModernBertForTokenClassification.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ModernBertForTokenClassification.is_pooling_model", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ModernBertForTokenClassification.head_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModernBertForTokenClassification.num_labels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModernBertForTokenClassification.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModernBertForTokenClassification.head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModernBertForTokenClassification.classifier", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModernBertForTokenClassification.pooler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 10, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.modernbert.ModernBertModel", "methods": [ { "kind": "function", "name": "ModernBertModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ModernBertModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModernBertModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModernBertModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ModernBertModel.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModernBertModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModernBertModel.embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModernBertModel.encoder_layer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModernBertModel.final_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 11, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.modernbert.ModernBertForSequenceClassification", "methods": [ { "kind": "function", "name": "ModernBertForSequenceClassification.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ModernBertForSequenceClassification.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModernBertForSequenceClassification.load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModernBertForSequenceClassification.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ModernBertForSequenceClassification.is_pooling_model", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ModernBertForSequenceClassification.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModernBertForSequenceClassification.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModernBertForSequenceClassification.classifier", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModernBertForSequenceClassification.pooling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModernBertForSequenceClassification.pooler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 10, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.modernbert.ModernBertEncoderLayer", "methods": [ { "kind": "function", "name": "ModernBertEncoderLayer.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ModernBertEncoderLayer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ModernBertEncoderLayer.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.modernbert.ModernBertPooler", "methods": [ { "kind": "function", "name": "ModernBertPooler.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ModernBertPooler.dense", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModernBertPooler.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModernBertPooler.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModernBertPooler.head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 6, "n_typed": 1, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.modernbert.ModernBertMLP", "methods": [ { "kind": "function", "name": "ModernBertMLP.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ModernBertMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ModernBertMLP.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModernBertMLP.Wi", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModernBertMLP.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModernBertMLP.Wo", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 4, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.modernbert.ModernBertPredictionHead", "methods": [ { "kind": "function", "name": "ModernBertPredictionHead.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModernBertPredictionHead.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ModernBertPredictionHead.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModernBertPredictionHead.dense", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModernBertPredictionHead.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModernBertPredictionHead.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 2, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.modernbert.ModernBertEmbeddings", "methods": [ { "kind": "function", "name": "ModernBertEmbeddings.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModernBertEmbeddings.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModernBertEmbeddings.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ModernBertEmbeddings.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModernBertEmbeddings.tok_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModernBertEmbeddings.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 6, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.modernbert.ModernBertLayer", "methods": [ { "kind": "function", "name": "ModernBertLayer.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ModernBertLayer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ModernBertLayer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModernBertLayer.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModernBertLayer.mlp_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModernBertLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModernBertLayer.attn_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 6, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.modernbert.ModernBertAttention", "methods": [ { "kind": "function", "name": "ModernBertAttention.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ModernBertAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ModernBertAttention.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModernBertAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModernBertAttention.layer_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModernBertAttention.deterministic_flash_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModernBertAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModernBertAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModernBertAttention.all_head_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModernBertAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModernBertAttention.Wqkv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModernBertAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModernBertAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModernBertAttention.Wo", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 6, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 12, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.modernbert", "names": [ "vllm.model_executor.models.modernbert.ModernBertAttention", "vllm.model_executor.models.modernbert.ModernBertEmbeddings", "vllm.model_executor.models.modernbert.ModernBertEncoderLayer", "vllm.model_executor.models.modernbert.ModernBertForSequenceClassification", "vllm.model_executor.models.modernbert.ModernBertForTokenClassification", "vllm.model_executor.models.modernbert.ModernBertLayer", "vllm.model_executor.models.modernbert.ModernBertMLP", "vllm.model_executor.models.modernbert.ModernBertModel", "vllm.model_executor.models.modernbert.ModernBertPooler", "vllm.model_executor.models.modernbert.ModernBertPredictionHead" ], "n_typable": 123, "n_typed": 61, "n_any": 0, "n_untyped": 62, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 26, "n_method_overloads": 26, "n_method_params": 48, "n_classes": 10, "n_attrs": 51, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/module_mapping.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.module_mapping.MultiModelKeys", "methods": [ { "kind": "function", "name": "MultiModelKeys.from_string_field", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MultiModelKeys.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MultiModelKeys.connector", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MultiModelKeys.tower_model", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MultiModelKeys.generator", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 6, "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 5, "n_attrs": 4, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.module_mapping", "names": [ "vllm.model_executor.models.module_mapping.MultiModelKeys" ], "n_typable": 6, "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 5, "n_classes": 1, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/molmo.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.models.molmo.POOLING_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.molmo.MolmoDecoderNormAfterLayer", "methods": [ { "kind": "function", "name": "MolmoDecoderNormAfterLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.molmo.MolmoProcessingInfo", "methods": [ { "kind": "function", "name": "MolmoProcessingInfo.get_hf_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MolmoProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MolmoProcessingInfo.get_num_image_tokens", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MolmoProcessingInfo.get_image_size_with_most_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 8, "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.molmo.MolmoModel", "methods": [ { "kind": "function", "name": "MolmoModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MolmoModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MolmoModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MolmoModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MolmoModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MolmoModel.embedding_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MolmoModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MolmoModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MolmoModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 11, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 5, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.molmo.get_num_patches", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "class", "name": "vllm.model_executor.models.molmo.MultiHeadDotProductAttention", "methods": [ { "kind": "function", "name": "MultiHeadDotProductAttention.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MultiHeadDotProductAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MultiHeadDotProductAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadDotProductAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadDotProductAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadDotProductAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadDotProductAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadDotProductAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadDotProductAttention.wq", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadDotProductAttention.wk", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadDotProductAttention.wv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadDotProductAttention.wo", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadDotProductAttention.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadDotProductAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 8, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 12, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.molmo.MolmoProcessorWrapper", "methods": [ { "kind": "function", "name": "MolmoProcessorWrapper.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MolmoProcessorWrapper.select_tiling", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MolmoProcessorWrapper.get_patches_grid_size", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MolmoProcessorWrapper.__call__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [ { "kind": "property", "name": "MolmoProcessorWrapper.vocab", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "MolmoProcessorWrapper.max_crops", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "MolmoProcessorWrapper.base_image_input_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "MolmoProcessorWrapper.image_patch_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "MolmoProcessorWrapper.overlap_margins", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "MolmoProcessorWrapper.image_token_length_w", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "MolmoProcessorWrapper.image_token_length_h", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "MolmoProcessorWrapper.message_format", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "MolmoProcessorWrapper.always_start_with_space", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "MolmoProcessorWrapper.image_patch_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "MolmoProcessorWrapper.im_col_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "MolmoProcessorWrapper.im_start_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "MolmoProcessorWrapper.im_end_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "MolmoProcessorWrapper.pooling_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "MolmoProcessorWrapper.processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 28, "n_typed": 25, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 9, "n_attrs": 1, "n_properties": 14 }, { "kind": "attr", "name": "vllm.model_executor.models.molmo.IM_START_TOKEN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.molmo.MolmoVisionBackbone", "methods": [ { "kind": "function", "name": "MolmoVisionBackbone.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MolmoVisionBackbone.encode_image", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MolmoVisionBackbone.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MolmoVisionBackbone.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "MolmoVisionBackbone.dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "MolmoVisionBackbone.device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "MolmoVisionBackbone.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MolmoVisionBackbone.vit_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MolmoVisionBackbone.image_num_patch", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MolmoVisionBackbone.llm_patches_per_crop", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MolmoVisionBackbone.image_vit", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MolmoVisionBackbone.num_prefix_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MolmoVisionBackbone.image_pooling_2d", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MolmoVisionBackbone.image_projector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MolmoVisionBackbone.pad_embed", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 14, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 9, "n_properties": 2 }, { "kind": "class", "name": "vllm.model_executor.models.molmo.MolmoDummyInputsBuilder", "methods": [ { "kind": "function", "name": "MolmoDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MolmoDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.molmo.VisionTransformer", "methods": [ { "kind": "function", "name": "VisionTransformer.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "VisionTransformer.add_pos_emb", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VisionTransformer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "VisionTransformer.patch_num", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VisionTransformer.class_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VisionTransformer.num_prefix_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VisionTransformer.positional_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VisionTransformer.patch_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VisionTransformer.pre_ln", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VisionTransformer.transformer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 10, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.molmo.MolmoDecoderLayer", "methods": [ { "kind": "function", "name": "MolmoDecoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MolmoDecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MolmoDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MolmoDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MolmoDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MolmoDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 9, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.molmo.MolmoImageInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "MolmoImageInputs.images", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MolmoImageInputs.image_masks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MolmoImageInputs.image_input_idx", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MolmoImageInputs.num_crops", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.molmo.MolmoAttention", "methods": [ { "kind": "function", "name": "MolmoAttention.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MolmoAttention._apply_qk_norm", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MolmoAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MolmoAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MolmoAttention.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MolmoAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MolmoAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MolmoAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MolmoAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MolmoAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MolmoAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MolmoAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MolmoAttention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MolmoAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MolmoAttention.tp_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MolmoAttention.k_norm", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MolmoAttention.q_norm", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MolmoAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MolmoAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MolmoAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MolmoAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 29, "n_typed": 14, "n_any": 0, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 8, "n_attrs": 18, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.molmo.BlockCollection", "methods": [ { "kind": "function", "name": "BlockCollection.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BlockCollection.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BlockCollection.resblocks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.molmo.ResidualAttentionBlock", "methods": [ { "kind": "function", "name": "ResidualAttentionBlock.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ResidualAttentionBlock.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ResidualAttentionBlock.attention", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ResidualAttentionBlock.feed_forward", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ResidualAttentionBlock.attention_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ResidualAttentionBlock.ffn_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 5, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.molmo.ViTMLP", "methods": [ { "kind": "function", "name": "ViTMLP.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ViTMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ViTMLP.w1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ViTMLP.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ViTMLP.w2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 5, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.molmo.VisionBackboneConfig", "methods": [ { "kind": "function", "name": "VisionBackboneConfig.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "VisionBackboneConfig.image_num_patch", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "VisionBackboneConfig.image_default_input_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VisionBackboneConfig.image_patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VisionBackboneConfig.image_pos_patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VisionBackboneConfig.image_emb_dim", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VisionBackboneConfig.image_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VisionBackboneConfig.image_num_key_value_heads", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VisionBackboneConfig.image_num_layers", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VisionBackboneConfig.image_mlp_dim", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VisionBackboneConfig.image_mlp_activations", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VisionBackboneConfig.image_num_pos", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VisionBackboneConfig.image_norm_eps", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 2, "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 11, "n_properties": 1 }, { "kind": "function", "name": "vllm.model_executor.models.molmo.get_candidate_tilings", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.model_executor.models.molmo.MolmoForCausalLM", "methods": [ { "kind": "function", "name": "MolmoForCausalLM.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MolmoForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MolmoForCausalLM._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MolmoForCausalLM._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MolmoForCausalLM.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MolmoForCausalLM.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MolmoForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MolmoForCausalLM.load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MolmoForCausalLM.get_mm_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MolmoForCausalLM.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MolmoForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MolmoForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MolmoForCausalLM.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MolmoForCausalLM.img_patch_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MolmoForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MolmoForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MolmoForCausalLM.vision_backbone", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MolmoForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MolmoForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 32, "n_typed": 21, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 14, "n_attrs": 10, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.molmo.get_patches_grid_size", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "attr", "name": "vllm.model_executor.models.molmo.NUM_PREFIX_TOKENS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.molmo.LanguageModelMLP", "methods": [ { "kind": "function", "name": "LanguageModelMLP.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "LanguageModelMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LanguageModelMLP.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LanguageModelMLP.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LanguageModelMLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LanguageModelMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LanguageModelMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 5, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.molmo.ADDITIONAL_VOCAB_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.molmo.IM_COL_TOKEN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.molmo.VIT_LAYERS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.molmo.MolmoMultiModalProcessor", "methods": [ { "kind": "function", "name": "MolmoMultiModalProcessor._apply_hf_processor_tokens_only", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MolmoMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MolmoMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.molmo.IMAGE_PATCH_TOKEN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.molmo.IM_END_TOKEN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.model_executor.models.molmo.select_tiling", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.model_executor.models.molmo.ImageProjectorMLP", "methods": [ { "kind": "function", "name": "ImageProjectorMLP.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ImageProjectorMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ImageProjectorMLP.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ImageProjectorMLP.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ImageProjectorMLP.merged_linear", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ImageProjectorMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ImageProjectorMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 5, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.molmo", "names": [ "vllm.model_executor.models.molmo.ADDITIONAL_VOCAB_SIZE", "vllm.model_executor.models.molmo.BlockCollection", "vllm.model_executor.models.molmo.IMAGE_PATCH_TOKEN", "vllm.model_executor.models.molmo.IM_COL_TOKEN", "vllm.model_executor.models.molmo.IM_END_TOKEN", "vllm.model_executor.models.molmo.IM_START_TOKEN", "vllm.model_executor.models.molmo.ImageProjectorMLP", "vllm.model_executor.models.molmo.LanguageModelMLP", "vllm.model_executor.models.molmo.MolmoAttention", "vllm.model_executor.models.molmo.MolmoDecoderLayer", "vllm.model_executor.models.molmo.MolmoDecoderNormAfterLayer", "vllm.model_executor.models.molmo.MolmoDummyInputsBuilder", "vllm.model_executor.models.molmo.MolmoForCausalLM", "vllm.model_executor.models.molmo.MolmoImageInputs", "vllm.model_executor.models.molmo.MolmoModel", "vllm.model_executor.models.molmo.MolmoMultiModalProcessor", "vllm.model_executor.models.molmo.MolmoProcessingInfo", "vllm.model_executor.models.molmo.MolmoProcessorWrapper", "vllm.model_executor.models.molmo.MolmoVisionBackbone", "vllm.model_executor.models.molmo.MultiHeadDotProductAttention", "vllm.model_executor.models.molmo.NUM_PREFIX_TOKENS", "vllm.model_executor.models.molmo.POOLING_SIZE", "vllm.model_executor.models.molmo.ResidualAttentionBlock", "vllm.model_executor.models.molmo.VIT_LAYERS", "vllm.model_executor.models.molmo.ViTMLP", "vllm.model_executor.models.molmo.VisionBackboneConfig", "vllm.model_executor.models.molmo.VisionTransformer", "vllm.model_executor.models.molmo.get_candidate_tilings", "vllm.model_executor.models.molmo.get_num_patches", "vllm.model_executor.models.molmo.get_patches_grid_size", "vllm.model_executor.models.molmo.select_tiling" ], "n_typable": 282, "n_typed": 191, "n_any": 0, "n_untyped": 91, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 16, "n_methods": 52, "n_method_overloads": 52, "n_method_params": 107, "n_classes": 19, "n_attrs": 107, "n_properties": 17, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/molmo2.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.molmo2.Molmo2TextModel", "methods": [ { "kind": "function", "name": "Molmo2TextModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Molmo2TextModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Molmo2TextModel.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Molmo2TextModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Molmo2TextModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2TextModel.embedding_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2TextModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2TextModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2TextModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 12, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 9, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.molmo2.Molmo2ForConditionalGeneration", "methods": [ { "kind": "function", "name": "Molmo2ForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Molmo2ForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Molmo2ForConditionalGeneration._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Molmo2ForConditionalGeneration._parse_and_validate_video_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Molmo2ForConditionalGeneration._parse_and_validate_multimodal_inputs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Molmo2ForConditionalGeneration._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Molmo2ForConditionalGeneration._process_video_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Molmo2ForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Molmo2ForConditionalGeneration.embed_input_ids", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Molmo2ForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Molmo2ForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Molmo2ForConditionalGeneration.load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Molmo2ForConditionalGeneration.get_mm_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "Molmo2ForConditionalGeneration.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "Molmo2ForConditionalGeneration.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2ForConditionalGeneration.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Molmo2ForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2ForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2ForConditionalGeneration.img_patch_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2ForConditionalGeneration.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2ForConditionalGeneration.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2ForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2ForConditionalGeneration.vision_backbone", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2ForConditionalGeneration.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 44, "n_typed": 32, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 21, "n_attrs": 10, "n_properties": 1 }, { "kind": "class", "name": "vllm.model_executor.models.molmo2.Molmo2ImageInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Molmo2ImageInputs.pixel_values", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2ImageInputs.token_pooling", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2ImageInputs.num_pooled_patches", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2ImageInputs.image_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2ImageInputs.num_image_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.molmo2.Molmo2VideoInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Molmo2VideoInputs.pixel_values_videos", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2VideoInputs.token_pooling", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2VideoInputs.num_pooled_patches", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2VideoInputs.video_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2VideoInputs.num_video_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.molmo2.Molmo2VisionBlock", "methods": [ { "kind": "function", "name": "Molmo2VisionBlock.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Molmo2VisionBlock.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Molmo2VisionBlock.attention", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2VisionBlock.feed_forward", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2VisionBlock.attention_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2VisionBlock.ffn_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 6, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.molmo2.Molmo2VisionTransformer", "methods": [ { "kind": "function", "name": "Molmo2VisionTransformer.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Molmo2VisionTransformer.add_pos_emb", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Molmo2VisionTransformer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Molmo2VisionTransformer.num_prefix_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2VisionTransformer.patch_num", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2VisionTransformer.positional_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2VisionTransformer.patch_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2VisionTransformer.transformer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 11, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 5, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.molmo2.get_image_size", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.model_executor.models.molmo2.AdapterConfig", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "AdapterConfig.vit_layers", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AdapterConfig.pooling_attention_mask", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AdapterConfig.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AdapterConfig.num_attention_heads", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AdapterConfig.num_key_value_heads", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AdapterConfig.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AdapterConfig.hidden_act", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AdapterConfig.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AdapterConfig.text_hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.molmo2.Molmo2DecoderLayer", "methods": [ { "kind": "function", "name": "Molmo2DecoderLayer.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Molmo2DecoderLayer.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Molmo2DecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2DecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2DecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2DecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 11, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 9, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.molmo2.TextConfig", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "TextConfig.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TextConfig.num_attention_heads", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TextConfig.num_key_value_heads", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TextConfig.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TextConfig.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TextConfig.additional_vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TextConfig.qkv_bias", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TextConfig.num_hidden_layers", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TextConfig.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TextConfig.hidden_act", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TextConfig.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TextConfig.rope_theta", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TextConfig.use_qk_norm", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TextConfig.qk_norm_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TextConfig.layer_norm_eps", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TextConfig.norm_after", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TextConfig.rope_scaling_layers", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 17, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.molmo2.build_flat_video_bool_length", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.model_executor.models.molmo2.Molmo2MultiModalProcessor", "methods": [ { "kind": "function", "name": "Molmo2MultiModalProcessor._apply_hf_processor_tokens_only", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Molmo2MultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Molmo2MultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Molmo2MultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 14, "n_typed": 14, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 10, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.molmo2.Molmo2VisionBackbone", "methods": [ { "kind": "function", "name": "Molmo2VisionBackbone.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Molmo2VisionBackbone.encode_image", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Molmo2VisionBackbone.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Molmo2VisionBackbone.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "Molmo2VisionBackbone.dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Molmo2VisionBackbone.device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "Molmo2VisionBackbone.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Molmo2VisionBackbone.vit_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2VisionBackbone.adapter_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2VisionBackbone.vit_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2VisionBackbone.image_vit", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2VisionBackbone.num_prefix_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2VisionBackbone.image_pooling_2d", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2VisionBackbone.image_projector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 15, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 8, "n_properties": 2 }, { "kind": "function", "name": "vllm.model_executor.models.molmo2.exif_tranpose", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.model_executor.models.molmo2.Molmo2ProcessorWrapper", "methods": [ { "kind": "function", "name": "Molmo2ProcessorWrapper.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Molmo2ProcessorWrapper.select_tiling", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Molmo2ProcessorWrapper.get_base_grid_size", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Molmo2ProcessorWrapper.get_patches_grid_size", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Molmo2ProcessorWrapper.__call__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [ { "kind": "property", "name": "Molmo2ProcessorWrapper.vocab", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Molmo2ProcessorWrapper.max_crops", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Molmo2ProcessorWrapper.image_pooling_h", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Molmo2ProcessorWrapper.image_pooling_w", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Molmo2ProcessorWrapper.video_pooling_h", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Molmo2ProcessorWrapper.video_pooling_w", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Molmo2ProcessorWrapper.base_image_input_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Molmo2ProcessorWrapper.image_patch_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Molmo2ProcessorWrapper.overlap_margins", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Molmo2ProcessorWrapper.bos_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Molmo2ProcessorWrapper.image_patch_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Molmo2ProcessorWrapper.im_col_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Molmo2ProcessorWrapper.im_start_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Molmo2ProcessorWrapper.im_end_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Molmo2ProcessorWrapper.low_res_im_start_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Molmo2ProcessorWrapper.frame_start_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Molmo2ProcessorWrapper.frame_end_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Molmo2ProcessorWrapper.im_low_res_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Molmo2ProcessorWrapper.image_placeholder_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Molmo2ProcessorWrapper.video_placeholder_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Molmo2ProcessorWrapper.image_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "Molmo2ProcessorWrapper.processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2ProcessorWrapper.hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 40, "n_typed": 37, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 12, "n_attrs": 2, "n_properties": 21 }, { "kind": "function", "name": "vllm.model_executor.models.molmo2.build_flat_image_bool_length", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "class", "name": "vllm.model_executor.models.molmo2.ImagePoolingAttention", "methods": [ { "kind": "function", "name": "ImagePoolingAttention.__init__", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "ImagePoolingAttention.forward_sdpa", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ImagePoolingAttention.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ImagePoolingAttention.input_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ImagePoolingAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ImagePoolingAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ImagePoolingAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ImagePoolingAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ImagePoolingAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ImagePoolingAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ImagePoolingAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ImagePoolingAttention.q_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ImagePoolingAttention.merged_kv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ImagePoolingAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ImagePoolingAttention.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ImagePoolingAttention.use_pytorch_sdpa", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ImagePoolingAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 33, "n_typed": 19, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 16, "n_attrs": 14, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.molmo2.Molmo2ProcessingInfo", "methods": [ { "kind": "function", "name": "Molmo2ProcessingInfo.get_data_parser", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Molmo2ProcessingInfo.get_hf_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Molmo2ProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Molmo2ProcessingInfo.get_num_image_tokens", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Molmo2ProcessingInfo.get_num_video_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Molmo2ProcessingInfo.get_image_size_with_most_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Molmo2ProcessingInfo._get_max_video_frames", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Molmo2ProcessingInfo.get_num_frames_with_most_features", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Molmo2ProcessingInfo._sample_frames", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "Molmo2ProcessingInfo._get_video_second_idx", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 29, "n_typed": 28, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 19, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.molmo2.ViTMLP", "methods": [ { "kind": "function", "name": "ViTMLP.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "ViTMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ViTMLP.w1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ViTMLP.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ViTMLP.w2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 8, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.molmo2.Molmo2Attention", "methods": [ { "kind": "function", "name": "Molmo2Attention.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Molmo2Attention._apply_qk_norm", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Molmo2Attention.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Molmo2Attention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2Attention.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2Attention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2Attention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2Attention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2Attention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2Attention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2Attention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2Attention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2Attention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2Attention.rope_theta", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2Attention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2Attention.tp_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2Attention.k_norm", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2Attention.q_norm", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2Attention.qk_norm_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2Attention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2Attention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2Attention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Molmo2Attention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 33, "n_typed": 17, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 10, "n_attrs": 20, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.molmo2.get_candidate_tilings", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.models.molmo2.get_patches_grid_size", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "attr", "name": "vllm.model_executor.models.molmo2.VIDEO_PROMPT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.molmo2.LanguageModelMLP", "methods": [ { "kind": "function", "name": "LanguageModelMLP.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "LanguageModelMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LanguageModelMLP.up_gate_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LanguageModelMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LanguageModelMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 7, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 3, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.molmo2.get_frame_times_and_chosen_fps", "n_typed": 0, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "attr", "name": "vllm.model_executor.models.molmo2.IMAGE_PROMPT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.molmo2.VitConfig", "methods": [ { "kind": "function", "name": "VitConfig.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "VitConfig.image_num_patch", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "VitConfig.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VitConfig.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VitConfig.num_hidden_layers", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VitConfig.num_attention_heads", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VitConfig.num_key_value_heads", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VitConfig.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VitConfig.hidden_act", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VitConfig.layer_norm_eps", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VitConfig.image_default_input_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VitConfig.image_patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VitConfig.image_num_pos", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 2, "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 11, "n_properties": 1 }, { "kind": "class", "name": "vllm.model_executor.models.molmo2.Molmo2DummyInputsBuilder", "methods": [ { "kind": "function", "name": "Molmo2DummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Molmo2DummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Molmo2DummyInputsBuilder._get_dummy_videos", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [], "n_typable": 11, "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 8, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.molmo2.Molmo2DecoderNormAfterLayer", "methods": [ { "kind": "function", "name": "Molmo2DecoderNormAfterLayer.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.molmo2.get_target_fps", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "class", "name": "vllm.model_executor.models.molmo2.ViTMultiHeadDotProductAttention", "methods": [ { "kind": "function", "name": "ViTMultiHeadDotProductAttention.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "ViTMultiHeadDotProductAttention.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ViTMultiHeadDotProductAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ViTMultiHeadDotProductAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ViTMultiHeadDotProductAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ViTMultiHeadDotProductAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ViTMultiHeadDotProductAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ViTMultiHeadDotProductAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ViTMultiHeadDotProductAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ViTMultiHeadDotProductAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ViTMultiHeadDotProductAttention.merged_qkv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ViTMultiHeadDotProductAttention.wo", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ViTMultiHeadDotProductAttention.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ViTMultiHeadDotProductAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 10, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 12, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.molmo2.select_tiling", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.model_executor.models.molmo2.ImageProjectorMLP", "methods": [ { "kind": "function", "name": "ImageProjectorMLP.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "ImageProjectorMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ImageProjectorMLP.merged_linear", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ImageProjectorMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ImageProjectorMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 9, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.molmo2.Molmo2VisionBlockCollection", "methods": [ { "kind": "function", "name": "Molmo2VisionBlockCollection.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Molmo2VisionBlockCollection.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Molmo2VisionBlockCollection.resblocks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.molmo2.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.models.molmo2.get_candidate_target_fps", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [], "name": "vllm.model_executor.models.molmo2", "names": [ "vllm.model_executor.models.molmo2.AdapterConfig", "vllm.model_executor.models.molmo2.IMAGE_PROMPT", "vllm.model_executor.models.molmo2.ImagePoolingAttention", "vllm.model_executor.models.molmo2.ImageProjectorMLP", "vllm.model_executor.models.molmo2.LanguageModelMLP", "vllm.model_executor.models.molmo2.Molmo2Attention", "vllm.model_executor.models.molmo2.Molmo2DecoderLayer", "vllm.model_executor.models.molmo2.Molmo2DecoderNormAfterLayer", "vllm.model_executor.models.molmo2.Molmo2DummyInputsBuilder", "vllm.model_executor.models.molmo2.Molmo2ForConditionalGeneration", "vllm.model_executor.models.molmo2.Molmo2ImageInputs", "vllm.model_executor.models.molmo2.Molmo2MultiModalProcessor", "vllm.model_executor.models.molmo2.Molmo2ProcessingInfo", "vllm.model_executor.models.molmo2.Molmo2ProcessorWrapper", "vllm.model_executor.models.molmo2.Molmo2TextModel", "vllm.model_executor.models.molmo2.Molmo2VideoInputs", "vllm.model_executor.models.molmo2.Molmo2VisionBackbone", "vllm.model_executor.models.molmo2.Molmo2VisionBlock", "vllm.model_executor.models.molmo2.Molmo2VisionBlockCollection", "vllm.model_executor.models.molmo2.Molmo2VisionTransformer", "vllm.model_executor.models.molmo2.TextConfig", "vllm.model_executor.models.molmo2.VIDEO_PROMPT", "vllm.model_executor.models.molmo2.ViTMLP", "vllm.model_executor.models.molmo2.ViTMultiHeadDotProductAttention", "vllm.model_executor.models.molmo2.VitConfig", "vllm.model_executor.models.molmo2.build_flat_image_bool_length", "vllm.model_executor.models.molmo2.build_flat_video_bool_length", "vllm.model_executor.models.molmo2.exif_tranpose", "vllm.model_executor.models.molmo2.get_candidate_target_fps", "vllm.model_executor.models.molmo2.get_candidate_tilings", "vllm.model_executor.models.molmo2.get_frame_times_and_chosen_fps", "vllm.model_executor.models.molmo2.get_image_size", "vllm.model_executor.models.molmo2.get_patches_grid_size", "vllm.model_executor.models.molmo2.get_target_fps", "vllm.model_executor.models.molmo2.logger", "vllm.model_executor.models.molmo2.select_tiling" ], "n_typable": 407, "n_typed": 306, "n_any": 0, "n_untyped": 101, "n_functions": 10, "n_function_overloads": 10, "n_function_params": 34, "n_methods": 68, "n_method_overloads": 68, "n_method_params": 167, "n_classes": 23, "n_attrs": 144, "n_properties": 25, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/moonvit.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.models.moonvit.apply_rope", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.model_executor.models.moonvit.MoonVitEncoderLayer", "methods": [ { "kind": "function", "name": "MoonVitEncoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "MoonVitEncoderLayer.attention_qkvpacked", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MoonVitEncoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MoonVitEncoderLayer.use_data_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonVitEncoderLayer.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonVitEncoderLayer.hidden_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonVitEncoderLayer.hidden_size_per_attention_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonVitEncoderLayer.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonVitEncoderLayer.num_attention_heads_per_partition", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonVitEncoderLayer.norm0", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonVitEncoderLayer.norm1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonVitEncoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonVitEncoderLayer.wqkv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonVitEncoderLayer.wo", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonVitEncoderLayer.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 27, "n_typed": 12, "n_any": 0, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 12, "n_attrs": 12, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.moonvit.Learnable2DInterpPosEmb", "methods": [ { "kind": "function", "name": "Learnable2DInterpPosEmb.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Learnable2DInterpPosEmb.reset_parameters", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Learnable2DInterpPosEmb.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Learnable2DInterpPosEmb.height", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Learnable2DInterpPosEmb.width", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Learnable2DInterpPosEmb.interpolation_mode", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Learnable2DInterpPosEmb.weight", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 8, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.moonvit.Rope2DPosEmb", "methods": [ { "kind": "function", "name": "Rope2DPosEmb.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Rope2DPosEmb.extra_repr", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Rope2DPosEmb.get_freqs_cis_by_seqlens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Rope2DPosEmb.get_freqs_cis_by_idx", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [ { "kind": "property", "name": "Rope2DPosEmb.precomputed_freqs_cis", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "Rope2DPosEmb.dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Rope2DPosEmb.max_height", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Rope2DPosEmb.max_width", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Rope2DPosEmb.theta_base", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Rope2DPosEmb.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 9, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 5, "n_properties": 1 }, { "kind": "function", "name": "vllm.model_executor.models.moonvit.patch_merger", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.model_executor.models.moonvit.MoonVisionPatchEmbed", "methods": [ { "kind": "function", "name": "MoonVisionPatchEmbed.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MoonVisionPatchEmbed.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MoonVisionPatchEmbed.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonVisionPatchEmbed.proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonVisionPatchEmbed.pos_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 8, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.moonvit.MLP2", "methods": [ { "kind": "function", "name": "MLP2.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MLP2.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MLP2.use_data_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLP2.fc0", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLP2.fc1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLP2.activation", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 5, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.moonvit.MoonVitEncoder", "methods": [ { "kind": "function", "name": "MoonVitEncoder.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MoonVitEncoder.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MoonVitEncoder.rope_2d", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonVitEncoder.blocks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonVitEncoder.final_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 8, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.moonvit.MoonVitPretrainedModel", "methods": [ { "kind": "function", "name": "MoonVitPretrainedModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MoonVitPretrainedModel.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MoonVitPretrainedModel.config_class", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MoonVitPretrainedModel.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MoonVitPretrainedModel._no_split_modules", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MoonVitPretrainedModel._supports_flash_attn_2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MoonVitPretrainedModel._supports_sdpa", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MoonVitPretrainedModel.merge_kernel_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonVitPretrainedModel.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonVitPretrainedModel.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonVitPretrainedModel.vit_processing_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonVitPretrainedModel.patch_embed", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonVitPretrainedModel.encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 5, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 11, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.moonvit", "names": [ "vllm.model_executor.models.moonvit.Learnable2DInterpPosEmb", "vllm.model_executor.models.moonvit.MLP2", "vllm.model_executor.models.moonvit.MoonVisionPatchEmbed", "vllm.model_executor.models.moonvit.MoonVitEncoder", "vllm.model_executor.models.moonvit.MoonVitEncoderLayer", "vllm.model_executor.models.moonvit.MoonVitPretrainedModel", "vllm.model_executor.models.moonvit.Rope2DPosEmb", "vllm.model_executor.models.moonvit.apply_rope", "vllm.model_executor.models.moonvit.patch_merger" ], "n_typable": 114, "n_typed": 63, "n_any": 0, "n_untyped": 51, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 6, "n_methods": 18, "n_method_overloads": 18, "n_method_params": 50, "n_classes": 7, "n_attrs": 42, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/mpt.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.mpt.MPTForCausalLM", "methods": [ { "kind": "function", "name": "MPTForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MPTForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MPTForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MPTForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MPTForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MPTForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MPTForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MPTForCausalLM.transformer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MPTForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MPTForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MPTForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 13, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mpt.MPTMLP", "methods": [ { "kind": "function", "name": "MPTMLP.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MPTMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MPTMLP.up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MPTMLP.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MPTMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 5, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mpt.MPTBlock", "methods": [ { "kind": "function", "name": "MPTBlock.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MPTBlock.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MPTBlock.norm_1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MPTBlock.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MPTBlock.norm_2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MPTBlock.ffn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mpt.MPTModel", "methods": [ { "kind": "function", "name": "MPTModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MPTModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MPTModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MPTModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MPTModel.wte", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MPTModel.norm_f", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MPTModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 11, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.mpt.MPTAttention", "methods": [ { "kind": "function", "name": "MPTAttention.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MPTAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MPTAttention.d_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MPTAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MPTAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MPTAttention.clip_qkv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MPTAttention.qk_ln", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MPTAttention.alibi_bias_max", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MPTAttention.Wqkv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MPTAttention.out_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MPTAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MPTAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MPTAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MPTAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MPTAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MPTAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MPTAttention.q_ln", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MPTAttention.k_ln", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 24, "n_typed": 7, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 16, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.mpt", "names": [ "vllm.model_executor.models.mpt.MPTAttention", "vllm.model_executor.models.mpt.MPTBlock", "vllm.model_executor.models.mpt.MPTForCausalLM", "vllm.model_executor.models.mpt.MPTMLP", "vllm.model_executor.models.mpt.MPTModel" ], "n_typable": 80, "n_typed": 43, "n_any": 0, "n_untyped": 37, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 33, "n_classes": 5, "n_attrs": 32, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/musicflamingo.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.musicflamingo.MusicFlamingoProcessingInfo", "methods": [ { "kind": "function", "name": "MusicFlamingoProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MusicFlamingoProcessingInfo.get_hf_processor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MusicFlamingoProcessingInfo.get_feature_extractor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MusicFlamingoProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 3, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.musicflamingo.MusicFlamingoProcessor", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.musicflamingo.MusicFlamingoConfig", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.musicflamingo.MusicFlamingoDummyInputsBuilder", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.musicflamingo.MusicFlamingoForConditionalGeneration", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.musicflamingo", "names": [ "vllm.model_executor.models.musicflamingo.MusicFlamingoConfig", "vllm.model_executor.models.musicflamingo.MusicFlamingoDummyInputsBuilder", "vllm.model_executor.models.musicflamingo.MusicFlamingoForConditionalGeneration", "vllm.model_executor.models.musicflamingo.MusicFlamingoProcessingInfo", "vllm.model_executor.models.musicflamingo.MusicFlamingoProcessor" ], "n_typable": 6, "n_typed": 3, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 2, "n_classes": 3, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/nano_nemotron_vl.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.nano_nemotron_vl.BaseNanoNemotronVLProcessor", "methods": [ { "kind": "function", "name": "BaseNanoNemotronVLProcessor.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "BaseNanoNemotronVLProcessor.use_dynamic_resolution", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseNanoNemotronVLProcessor.get_image_repl", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseNanoNemotronVLProcessor.get_num_image_tokens", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BaseNanoNemotronVLProcessor._images_to_pixel_values_lst", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseNanoNemotronVLProcessor._preprocess_image", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BaseNanoNemotronVLProcessor._make_batch_input", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseNanoNemotronVLProcessor.__call__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [ { "kind": "property", "name": "BaseNanoNemotronVLProcessor.image_token_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "BaseNanoNemotronVLProcessor.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseNanoNemotronVLProcessor.tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseNanoNemotronVLProcessor.max_num_tiles", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseNanoNemotronVLProcessor.num_image_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseNanoNemotronVLProcessor.image_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseNanoNemotronVLProcessor.use_thumbnail", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BaseNanoNemotronVLProcessor.norm_mean", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseNanoNemotronVLProcessor.norm_std", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseNanoNemotronVLProcessor.dynamic_tiler", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 40, "n_typed": 30, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 22, "n_attrs": 9, "n_properties": 1 }, { "kind": "attr", "name": "vllm.model_executor.models.nano_nemotron_vl.AUDIO_END", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.nano_nemotron_vl.MAX_AUDIO_LEN_S", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nano_nemotron_vl.NanoNemotronVLImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "NanoNemotronVLImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NanoNemotronVLImagePixelInputs.pixel_values_flat", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NanoNemotronVLImagePixelInputs.num_patches", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nano_nemotron_vl.DynamicResolutionParams", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "DynamicResolutionParams.media", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DynamicResolutionParams.num_tiles", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DynamicResolutionParams.num_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DynamicResolutionParams.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nano_nemotron_vl.NanoNemotronVLProcessingInfo", "methods": [ { "kind": "function", "name": "NanoNemotronVLProcessingInfo.get_data_parser", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NanoNemotronVLProcessingInfo.get_supported_mm_limits", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NanoNemotronVLProcessingInfo.get_video_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NanoNemotronVLProcessingInfo.get_video_pruning_rate", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NanoNemotronVLProcessingInfo.get_num_frames_with_most_features", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NanoNemotronVLProcessingInfo.get_hf_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "NanoNemotronVLProcessingInfo.supports_video", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "NanoNemotronVLProcessingInfo.audio_extractor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [], "n_typable": 11, "n_typed": 8, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 3, "n_attrs": 0, "n_properties": 2 }, { "kind": "function", "name": "vllm.model_executor.models.nano_nemotron_vl.video_to_pixel_values", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.model_executor.models.nano_nemotron_vl.NanoNemotronVLVideoEmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "NanoNemotronVLVideoEmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NanoNemotronVLVideoEmbeddingInputs.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nano_nemotron_vl.NemotronH_Nano_VL_V2", "methods": [ { "kind": "function", "name": "NemotronH_Nano_VL_V2.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NemotronH_Nano_VL_V2.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NemotronH_Nano_VL_V2.pixel_shuffle", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NemotronH_Nano_VL_V2.pixel_shuffle_dynamic_res", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NemotronH_Nano_VL_V2.extract_feature_dynamic", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NemotronH_Nano_VL_V2.extract_feature", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NemotronH_Nano_VL_V2._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NemotronH_Nano_VL_V2._process_image_input_dynamic", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NemotronH_Nano_VL_V2._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NemotronH_Nano_VL_V2._process_video_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NemotronH_Nano_VL_V2._process_audio_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NemotronH_Nano_VL_V2._create_final_video_embeddings", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "NemotronH_Nano_VL_V2._parse_and_validate_video_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NemotronH_Nano_VL_V2._parse_and_validate_multimodal_inputs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NemotronH_Nano_VL_V2.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NemotronH_Nano_VL_V2.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "NemotronH_Nano_VL_V2.get_mm_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NemotronH_Nano_VL_V2.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NemotronH_Nano_VL_V2.load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NemotronH_Nano_VL_V2.get_vit_model_from_radio_config", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NemotronH_Nano_VL_V2.copy_inputs_before_cuda_graphs", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NemotronH_Nano_VL_V2.get_seqlen_agnostic_capture_inputs", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NemotronH_Nano_VL_V2.get_mamba_state_shape_from_config", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NemotronH_Nano_VL_V2.get_mamba_state_dtype_from_config", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NemotronH_Nano_VL_V2.get_mamba_state_copy_func", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "NemotronH_Nano_VL_V2.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronH_Nano_VL_V2.template", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronH_Nano_VL_V2.num_image_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronH_Nano_VL_V2.downsample_ratio", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronH_Nano_VL_V2.ps_version", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronH_Nano_VL_V2.image_tag_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronH_Nano_VL_V2.video_pruning_rate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronH_Nano_VL_V2.llm_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronH_Nano_VL_V2.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronH_Nano_VL_V2.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronH_Nano_VL_V2.dynamic_resolution", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronH_Nano_VL_V2.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronH_Nano_VL_V2.vision_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronH_Nano_VL_V2.mlp1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronH_Nano_VL_V2.sound_encoder", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 76, "n_typed": 46, "n_any": 0, "n_untyped": 30, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 25, "n_method_overloads": 25, "n_method_params": 36, "n_attrs": 15, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nano_nemotron_vl.NanoNemotronVLImageEmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "NanoNemotronVLImageEmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NanoNemotronVLImageEmbeddingInputs.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.nano_nemotron_vl.NanoNemotronVLImageInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.models.nano_nemotron_vl.image_to_pixel_values", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "attr", "name": "vllm.model_executor.models.nano_nemotron_vl.IMG_END", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nano_nemotron_vl.NanoNemotronVLDummyInputsBuilder", "methods": [ { "kind": "function", "name": "NanoNemotronVLDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NanoNemotronVLDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nano_nemotron_vl.NanoNemotronVLProcessor", "methods": [ { "kind": "function", "name": "NanoNemotronVLProcessor.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "NanoNemotronVLProcessor._videos_to_pixel_values_lst", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NanoNemotronVLProcessor._preprocess_video", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "NanoNemotronVLProcessor._preprocess_audio", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NanoNemotronVLProcessor.__call__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "NanoNemotronVLProcessor.get_image_repl", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NanoNemotronVLProcessor.get_audio_repl", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NanoNemotronVLProcessor.get_video_repl", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [ { "kind": "property", "name": "NanoNemotronVLProcessor.supports_video", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "NanoNemotronVLProcessor.video_token_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "NanoNemotronVLProcessor.image_token_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "NanoNemotronVLProcessor.video_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NanoNemotronVLProcessor.video_pruning_rate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NanoNemotronVLProcessor.audio_extractor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 43, "n_typed": 39, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 29, "n_attrs": 3, "n_properties": 3 }, { "kind": "attr", "name": "vllm.model_executor.models.nano_nemotron_vl.IMG_CONTEXT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.model_executor.models.nano_nemotron_vl.calculate_timestamps", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.models.nano_nemotron_vl.NanoNemotronVLImagePixelInputsDynamic", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "NanoNemotronVLImagePixelInputsDynamic.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NanoNemotronVLImagePixelInputsDynamic.pixel_values_flat", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NanoNemotronVLImagePixelInputsDynamic.imgs_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NanoNemotronVLImagePixelInputsDynamic.num_tokens_per_image", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nano_nemotron_vl.DynamicResolutionImageTiler", "methods": [ { "kind": "function", "name": "DynamicResolutionImageTiler.__init__", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "DynamicResolutionImageTiler._get_num_embeddings", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DynamicResolutionImageTiler.width_and_height_for_max_num_tokens_available", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DynamicResolutionImageTiler.max_num_tokens_available", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DynamicResolutionImageTiler._images_to_pixel_values_lst", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DynamicResolutionImageTiler.get_cached_feature_size", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DynamicResolutionImageTiler.apply_params", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DynamicResolutionImageTiler.process_media", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DynamicResolutionImageTiler.compute_params", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DynamicResolutionImageTiler.stack", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DynamicResolutionImageTiler.CONV_MERGING", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DynamicResolutionImageTiler.PIXEL_SHUFFLE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DynamicResolutionImageTiler.USE_THUMBNAIL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DynamicResolutionImageTiler.norm_mean", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DynamicResolutionImageTiler.norm_std", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DynamicResolutionImageTiler.feature_size_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 36, "n_typed": 34, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 23, "n_attrs": 6, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.nano_nemotron_vl.AUDIO_START", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nano_nemotron_vl.NanoNemotronVLAudioFeatureInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "NanoNemotronVLAudioFeatureInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NanoNemotronVLAudioFeatureInputs.input_audio_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NanoNemotronVLAudioFeatureInputs.feature_attention_mask", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NanoNemotronVLAudioFeatureInputs.audio_feature_lengths", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.nano_nemotron_vl.dynamic_preprocess", "n_typed": 0, "n_any": 0, "n_untyped": 6, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "attr", "name": "vllm.model_executor.models.nano_nemotron_vl.DEFAULT_NUM_TILES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nano_nemotron_vl.BaseNanoNemotronVLProcessingInfo", "methods": [ { "kind": "function", "name": "BaseNanoNemotronVLProcessingInfo.get_hf_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseNanoNemotronVLProcessingInfo.get_default_tok_params", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BaseNanoNemotronVLProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BaseNanoNemotronVLProcessingInfo.get_image_size_with_most_features", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseNanoNemotronVLProcessingInfo.get_max_image_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.nano_nemotron_vl.input_conditioner", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.model_executor.models.nano_nemotron_vl.AUDIO_CONTEXT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nano_nemotron_vl.NanoNemotronVLVideoPixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "NanoNemotronVLVideoPixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NanoNemotronVLVideoPixelInputs.pixel_values_flat", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NanoNemotronVLVideoPixelInputs.num_patches", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NanoNemotronVLVideoPixelInputs.frames_indices", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NanoNemotronVLVideoPixelInputs.frame_duration_ms", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nano_nemotron_vl.NanoNemotronBaseVLMultiModalProcessor", "methods": [ { "kind": "function", "name": "NanoNemotronBaseVLMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NanoNemotronBaseVLMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [ { "kind": "property", "name": "NanoNemotronBaseVLMultiModalProcessor.is_dynamic_tiler", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [], "n_typable": 8, "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 0, "n_properties": 1 }, { "kind": "attr", "name": "vllm.model_executor.models.nano_nemotron_vl.IMG_START", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nano_nemotron_vl.NanoNemotronVLMultiModalProcessor", "methods": [ { "kind": "function", "name": "NanoNemotronVLMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NanoNemotronVLMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.nano_nemotron_vl.NanoNemotronVLVideoInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.models.nano_nemotron_vl.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.models.nano_nemotron_vl", "names": [ "vllm.model_executor.models.nano_nemotron_vl.AUDIO_CONTEXT", "vllm.model_executor.models.nano_nemotron_vl.AUDIO_END", "vllm.model_executor.models.nano_nemotron_vl.AUDIO_START", "vllm.model_executor.models.nano_nemotron_vl.BaseNanoNemotronVLProcessingInfo", "vllm.model_executor.models.nano_nemotron_vl.BaseNanoNemotronVLProcessor", "vllm.model_executor.models.nano_nemotron_vl.DEFAULT_NUM_TILES", "vllm.model_executor.models.nano_nemotron_vl.DynamicResolutionImageTiler", "vllm.model_executor.models.nano_nemotron_vl.DynamicResolutionParams", "vllm.model_executor.models.nano_nemotron_vl.IMG_CONTEXT", "vllm.model_executor.models.nano_nemotron_vl.IMG_END", "vllm.model_executor.models.nano_nemotron_vl.IMG_START", "vllm.model_executor.models.nano_nemotron_vl.MAX_AUDIO_LEN_S", "vllm.model_executor.models.nano_nemotron_vl.NanoNemotronBaseVLMultiModalProcessor", "vllm.model_executor.models.nano_nemotron_vl.NanoNemotronVLAudioFeatureInputs", "vllm.model_executor.models.nano_nemotron_vl.NanoNemotronVLDummyInputsBuilder", "vllm.model_executor.models.nano_nemotron_vl.NanoNemotronVLImageEmbeddingInputs", "vllm.model_executor.models.nano_nemotron_vl.NanoNemotronVLImageInputs", "vllm.model_executor.models.nano_nemotron_vl.NanoNemotronVLImagePixelInputs", "vllm.model_executor.models.nano_nemotron_vl.NanoNemotronVLImagePixelInputsDynamic", "vllm.model_executor.models.nano_nemotron_vl.NanoNemotronVLMultiModalProcessor", "vllm.model_executor.models.nano_nemotron_vl.NanoNemotronVLProcessingInfo", "vllm.model_executor.models.nano_nemotron_vl.NanoNemotronVLProcessor", "vllm.model_executor.models.nano_nemotron_vl.NanoNemotronVLVideoEmbeddingInputs", "vllm.model_executor.models.nano_nemotron_vl.NanoNemotronVLVideoInputs", "vllm.model_executor.models.nano_nemotron_vl.NanoNemotronVLVideoPixelInputs", "vllm.model_executor.models.nano_nemotron_vl.NemotronH_Nano_VL_V2", "vllm.model_executor.models.nano_nemotron_vl.calculate_timestamps", "vllm.model_executor.models.nano_nemotron_vl.dynamic_preprocess", "vllm.model_executor.models.nano_nemotron_vl.image_to_pixel_values", "vllm.model_executor.models.nano_nemotron_vl.input_conditioner", "vllm.model_executor.models.nano_nemotron_vl.logger", "vllm.model_executor.models.nano_nemotron_vl.video_to_pixel_values" ], "n_typable": 281, "n_typed": 220, "n_any": 0, "n_untyped": 61, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 19, "n_methods": 68, "n_method_overloads": 68, "n_method_params": 129, "n_classes": 16, "n_attrs": 68, "n_properties": 7, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/nemotron.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.nemotron.NemotronMLP", "methods": [ { "kind": "function", "name": "NemotronMLP.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "NemotronMLP.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "NemotronMLP.up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nemotron.NemotronForCausalLM", "methods": [ { "kind": "function", "name": "NemotronForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NemotronForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NemotronForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "NemotronForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NemotronForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "NemotronForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NemotronForCausalLM.embedding_modules", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NemotronForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 13, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nemotron.NemotronLayerNorm1P", "methods": [ { "kind": "function", "name": "NemotronLayerNorm1P.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "NemotronLayerNorm1P.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 10, "n_typed": 7, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nemotron.NemotronAttention", "methods": [ { "kind": "function", "name": "NemotronAttention.__init__", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "NemotronAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "NemotronAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronAttention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 27, "n_typed": 13, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 11, "n_attrs": 14, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nemotron.NemotronModel", "methods": [ { "kind": "function", "name": "NemotronModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NemotronModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NemotronModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "NemotronModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "NemotronModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronModel.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 11, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nemotron.NemotronDecoderLayer", "methods": [ { "kind": "function", "name": "NemotronDecoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "NemotronDecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "NemotronDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 9, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 5, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.nemotron", "names": [ "vllm.model_executor.models.nemotron.NemotronAttention", "vllm.model_executor.models.nemotron.NemotronDecoderLayer", "vllm.model_executor.models.nemotron.NemotronForCausalLM", "vllm.model_executor.models.nemotron.NemotronLayerNorm1P", "vllm.model_executor.models.nemotron.NemotronMLP", "vllm.model_executor.models.nemotron.NemotronModel" ], "n_typable": 101, "n_typed": 60, "n_any": 0, "n_untyped": 41, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 17, "n_method_overloads": 17, "n_method_params": 50, "n_classes": 6, "n_attrs": 36, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/nemotron_h.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.nemotron_h.NemotronHAttention", "methods": [ { "kind": "function", "name": "NemotronHAttention.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "NemotronHAttention.forward", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "NemotronHAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 9, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 12, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nemotron_h.NemotronHMLPDecoderLayer", "methods": [ { "kind": "function", "name": "NemotronHMLPDecoderLayer.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "NemotronHMLPDecoderLayer.forward", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "NemotronHMLPDecoderLayer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMLPDecoderLayer.mixer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMLPDecoderLayer.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 10, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 10, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nemotron_h.NemotronHAttentionDecoderLayer", "methods": [ { "kind": "function", "name": "NemotronHAttentionDecoderLayer.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "NemotronHAttentionDecoderLayer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "NemotronHAttentionDecoderLayer.mixer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHAttentionDecoderLayer.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 11, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 11, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nemotron_h.NemotronHMLP", "methods": [ { "kind": "function", "name": "NemotronHMLP.__init__", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "NemotronHMLP.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "NemotronHMLP.up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 10, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 9, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nemotron_h.NemotronHMoE", "methods": [ { "kind": "function", "name": "NemotronHMoE.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "NemotronHMoE.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "NemotronHMoE.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMoE.routed_scaling_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMoE.ep_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMoE.ep_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMoE.ep_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMoE.n_routed_experts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMoE.n_shared_experts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMoE.use_latent_moe", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMoE.moe_hidden_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMoE.is_sequence_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMoE.gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMoE.enable_eplb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMoE.n_redundant_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMoE.n_logical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMoE.n_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMoE.n_local_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMoE.physical_expert_start", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMoE.physical_expert_end", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMoE.experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMoE.shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMoE.fc1_latent_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMoE.fc2_latent_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 29, "n_typed": 10, "n_any": 0, "n_untyped": 19, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 22, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nemotron_h.NemotronHMambaDecoderLayer", "methods": [ { "kind": "function", "name": "NemotronHMambaDecoderLayer.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "NemotronHMambaDecoderLayer.forward", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "NemotronHMambaDecoderLayer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMambaDecoderLayer.mixer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMambaDecoderLayer.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 10, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 10, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nemotron_h.NemotronHModel", "methods": [ { "kind": "function", "name": "NemotronHModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NemotronHModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NemotronHModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "NemotronHModel.is_spec_layer", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NemotronHModel._get_max_n_routed_experts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NemotronHModel.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NemotronHModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "NemotronHModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHModel.has_moe", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHModel.norm_f", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 23, "n_typed": 16, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 10, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nemotron_h.NemotronHForCausalLM", "methods": [ { "kind": "function", "name": "NemotronHForCausalLM.get_mamba_state_dtype_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NemotronHForCausalLM.get_mamba_state_shape_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NemotronHForCausalLM.get_mamba_state_copy_func", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NemotronHForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NemotronHForCausalLM.update_physical_experts_metadata", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NemotronHForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NemotronHForCausalLM.forward", "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "NemotronHForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NemotronHForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "NemotronHForCausalLM.is_non_gated_moe", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHForCausalLM.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NemotronHForCausalLM.embedding_modules", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NemotronHForCausalLM.lora_skip_prefixes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NemotronHForCausalLM.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHForCausalLM.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHForCausalLM.scheduler_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHForCausalLM.expert_weights", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHForCausalLM.num_expert_groups", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHForCausalLM.moe_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHForCausalLM.num_moe_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHForCausalLM.num_logical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHForCausalLM.num_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHForCausalLM.num_local_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHForCausalLM.num_routed_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHForCausalLM.num_shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHForCausalLM.num_redundant_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 44, "n_typed": 21, "n_any": 0, "n_untyped": 23, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 14, "n_attrs": 24, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.nemotron_h.ALL_DECODER_LAYER_TYPES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nemotron_h.NemotronHMoEDecoderLayer", "methods": [ { "kind": "function", "name": "NemotronHMoEDecoderLayer.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "NemotronHMoEDecoderLayer.forward", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "NemotronHMoEDecoderLayer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMoEDecoderLayer.mixer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMoEDecoderLayer.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 10, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 10, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.nemotron_h", "names": [ "vllm.model_executor.models.nemotron_h.ALL_DECODER_LAYER_TYPES", "vllm.model_executor.models.nemotron_h.NemotronHAttention", "vllm.model_executor.models.nemotron_h.NemotronHAttentionDecoderLayer", "vllm.model_executor.models.nemotron_h.NemotronHForCausalLM", "vllm.model_executor.models.nemotron_h.NemotronHMLP", "vllm.model_executor.models.nemotron_h.NemotronHMLPDecoderLayer", "vllm.model_executor.models.nemotron_h.NemotronHMambaDecoderLayer", "vllm.model_executor.models.nemotron_h.NemotronHMoE", "vllm.model_executor.models.nemotron_h.NemotronHMoEDecoderLayer", "vllm.model_executor.models.nemotron_h.NemotronHModel" ], "n_typable": 192, "n_typed": 107, "n_any": 0, "n_untyped": 85, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 30, "n_method_overloads": 30, "n_method_params": 87, "n_classes": 9, "n_attrs": 79, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/nemotron_h_mtp.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.nemotron_h_mtp.NemotronHMTPMoEDecoderLayer", "methods": [ { "kind": "function", "name": "NemotronHMTPMoEDecoderLayer.__init__", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "NemotronHMTPMoEDecoderLayer.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "NemotronHMTPMoEDecoderLayer.has_start_projections", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMTPMoEDecoderLayer.has_end_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMTPMoEDecoderLayer.enorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMTPMoEDecoderLayer.hnorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMTPMoEDecoderLayer.eh_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMTPMoEDecoderLayer.final_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 15, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 13, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nemotron_h_mtp.NemotronHMTP", "methods": [ { "kind": "function", "name": "NemotronHMTP.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NemotronHMTP.get_input_embeddings", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NemotronHMTP.forward", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "NemotronHMTP.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NemotronHMTP.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "NemotronHMTP.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NemotronHMTP.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMTP.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMTP.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMTP.mtp_start_layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMTP.num_redundant_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMTP.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMTP.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMTP.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMTP.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 25, "n_typed": 15, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 11, "n_attrs": 10, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nemotron_h_mtp.NemotronHMultiTokenPredictor", "methods": [ { "kind": "function", "name": "NemotronHMultiTokenPredictor.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NemotronHMultiTokenPredictor.get_input_embeddings", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NemotronHMultiTokenPredictor.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "NemotronHMultiTokenPredictor.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMultiTokenPredictor.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMultiTokenPredictor.org_vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMultiTokenPredictor.mtp_start_layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMultiTokenPredictor.num_mtp_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMultiTokenPredictor.pattern_str", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMultiTokenPredictor.pattern_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMultiTokenPredictor.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMultiTokenPredictor.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMultiTokenPredictor.make_empty_intermediate_tensors", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 21, "n_typed": 11, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 8, "n_attrs": 10, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nemotron_h_mtp.NemotronHMTPAttentionDecoderLayer", "methods": [ { "kind": "function", "name": "NemotronHMTPAttentionDecoderLayer.__init__", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "NemotronHMTPAttentionDecoderLayer.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "NemotronHMTPAttentionDecoderLayer.has_start_projections", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMTPAttentionDecoderLayer.has_end_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMTPAttentionDecoderLayer.enorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMTPAttentionDecoderLayer.hnorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMTPAttentionDecoderLayer.eh_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHMTPAttentionDecoderLayer.final_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 15, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 13, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.nemotron_h_mtp", "names": [ "vllm.model_executor.models.nemotron_h_mtp.NemotronHMTP", "vllm.model_executor.models.nemotron_h_mtp.NemotronHMTPAttentionDecoderLayer", "vllm.model_executor.models.nemotron_h_mtp.NemotronHMTPMoEDecoderLayer", "vllm.model_executor.models.nemotron_h_mtp.NemotronHMultiTokenPredictor" ], "n_typable": 88, "n_typed": 56, "n_any": 0, "n_untyped": 32, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 45, "n_classes": 4, "n_attrs": 32, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/nemotron_nas.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.nemotron_nas.DeciLMAttention", "methods": [ { "kind": "function", "name": "DeciLMAttention.__init__", "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "DeciLMAttention._init_rotary_emb", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 15, "n_typed": 14, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 13, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nemotron_nas.DeciLMForCausalLM", "methods": [ { "kind": "function", "name": "DeciLMForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeciLMForCausalLM._init_model", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeciLMForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeciLMForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "DeciLMForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeciLMForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DeciLMForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeciLMForCausalLM.embedding_modules", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeciLMForCausalLM.mistral_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeciLMForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeciLMForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeciLMForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeciLMForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeciLMForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 15, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 11, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nemotron_nas.DeciModel", "methods": [ { "kind": "function", "name": "DeciModel.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DeciModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeciModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "DeciModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DeciModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeciModel.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeciModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeciModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeciModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeciModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 12, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 9, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nemotron_nas.DeciLMDecoderLayer", "methods": [ { "kind": "function", "name": "DeciLMDecoderLayer.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "DeciLMDecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DeciLMDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeciLMDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeciLMDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeciLMDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeciLMDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 10, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 5, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.nemotron_nas", "names": [ "vllm.model_executor.models.nemotron_nas.DeciLMAttention", "vllm.model_executor.models.nemotron_nas.DeciLMDecoderLayer", "vllm.model_executor.models.nemotron_nas.DeciLMForCausalLM", "vllm.model_executor.models.nemotron_nas.DeciModel" ], "n_typable": 71, "n_typed": 51, "n_any": 0, "n_untyped": 20, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 41, "n_classes": 4, "n_attrs": 19, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/nemotron_parse.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.nemotron_parse.MBartDecoderNoPos", "methods": [ { "kind": "function", "name": "MBartDecoderNoPos.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "MBartDecoderNoPos.forward", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MBartDecoderNoPos.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MBartDecoderNoPos.cache_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MBartDecoderNoPos.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MBartDecoderNoPos.lora_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MBartDecoderNoPos.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MBartDecoderNoPos.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MBartDecoderNoPos.layernorm_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MBartDecoderNoPos.layer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 12, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 11, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nemotron_parse.NemotronParseMultiModalProcessor", "methods": [ { "kind": "function", "name": "NemotronParseMultiModalProcessor.create_encoder_prompt", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NemotronParseMultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "NemotronParseMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NemotronParseMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 15, "n_typed": 15, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 11, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nemotron_parse.NemotronParsePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "NemotronParsePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "NemotronParsePixelInputs.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.nemotron_parse.DEFAULT_FINAL_IMAGE_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nemotron_parse.NemotronParseProcessingInfo", "methods": [ { "kind": "function", "name": "NemotronParseProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NemotronParseProcessingInfo.get_hf_processor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NemotronParseProcessingInfo.get_default_tok_params", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NemotronParseProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NemotronParseProcessingInfo.get_num_image_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NemotronParseProcessingInfo.get_mm_max_tokens_per_item", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [ { "kind": "property", "name": "NemotronParseProcessingInfo.skip_prompt_length_check", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [], "n_typable": 10, "n_typed": 8, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 3, "n_attrs": 0, "n_properties": 1 }, { "kind": "class", "name": "vllm.model_executor.models.nemotron_parse.BartScaledWordEmbedding", "methods": [ { "kind": "function", "name": "BartScaledWordEmbedding.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BartScaledWordEmbedding.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BartScaledWordEmbedding.embed_scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nemotron_parse.BartParallelLMHead", "methods": [ { "kind": "function", "name": "BartParallelLMHead.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BartParallelLMHead.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BartParallelLMHead.embed_scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nemotron_parse.NemotronParseProcessor", "methods": [ { "kind": "function", "name": "NemotronParseProcessor.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "NemotronParseProcessor._make_batch_input", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NemotronParseProcessor.__call__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "NemotronParseProcessor.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronParseProcessor.tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronParseProcessor.image_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 7, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 8, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nemotron_parse.NemotronParseImageProcessor", "methods": [ { "kind": "function", "name": "NemotronParseImageProcessor.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NemotronParseImageProcessor._create_transforms", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NemotronParseImageProcessor._resize_with_aspect_ratio", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NemotronParseImageProcessor._pad_to_size", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NemotronParseImageProcessor.preprocess", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NemotronParseImageProcessor.__call__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "NemotronParseImageProcessor.norm_mean", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronParseImageProcessor.norm_std", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronParseImageProcessor.final_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 9, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 8, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nemotron_parse.RadioWithNeck", "methods": [ { "kind": "function", "name": "RadioWithNeck.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "RadioWithNeck.get_vit_model_from_radio_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "RadioWithNeck.forward", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "RadioWithNeck.load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RadioWithNeck.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RadioWithNeck.model_encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RadioWithNeck.conv1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RadioWithNeck.layer_norm1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RadioWithNeck.conv2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RadioWithNeck.layer_norm2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RadioWithNeck.sum_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RadioWithNeck.layer_norm3", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 9, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nemotron_parse.MBartDecoderLayer", "methods": [ { "kind": "function", "name": "MBartDecoderLayer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nemotron_parse.BartDecoderLayer", "methods": [ { "kind": "function", "name": "BartDecoderLayer.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BartDecoderLayer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BartDecoderLayer.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BartDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BartDecoderLayer.activation_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BartDecoderLayer.self_attn_layer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BartDecoderLayer.encoder_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BartDecoderLayer.encoder_attn_layer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BartDecoderLayer.fc1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BartDecoderLayer.fc2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BartDecoderLayer.final_layer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 7, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nemotron_parse.NemotronParseForConditionalGeneration", "methods": [ { "kind": "function", "name": "NemotronParseForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NemotronParseForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NemotronParseForConditionalGeneration._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NemotronParseForConditionalGeneration._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NemotronParseForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NemotronParseForConditionalGeneration.forward", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "NemotronParseForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NemotronParseForConditionalGeneration.load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "NemotronParseForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronParseForConditionalGeneration.vision_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronParseForConditionalGeneration.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronParseForConditionalGeneration.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronParseForConditionalGeneration.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronParseForConditionalGeneration.encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronParseForConditionalGeneration.decoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 28, "n_typed": 18, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 13, "n_attrs": 7, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.nemotron_parse.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.nemotron_parse.NemotronParseDummyInputsBuilder", "methods": [ { "kind": "function", "name": "NemotronParseDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NemotronParseDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.nemotron_parse", "names": [ "vllm.model_executor.models.nemotron_parse.BartDecoderLayer", "vllm.model_executor.models.nemotron_parse.BartParallelLMHead", "vllm.model_executor.models.nemotron_parse.BartScaledWordEmbedding", "vllm.model_executor.models.nemotron_parse.DEFAULT_FINAL_IMAGE_SIZE", "vllm.model_executor.models.nemotron_parse.MBartDecoderLayer", "vllm.model_executor.models.nemotron_parse.MBartDecoderNoPos", "vllm.model_executor.models.nemotron_parse.NemotronParseDummyInputsBuilder", "vllm.model_executor.models.nemotron_parse.NemotronParseForConditionalGeneration", "vllm.model_executor.models.nemotron_parse.NemotronParseImageProcessor", "vllm.model_executor.models.nemotron_parse.NemotronParseMultiModalProcessor", "vllm.model_executor.models.nemotron_parse.NemotronParsePixelInputs", "vllm.model_executor.models.nemotron_parse.NemotronParseProcessingInfo", "vllm.model_executor.models.nemotron_parse.NemotronParseProcessor", "vllm.model_executor.models.nemotron_parse.RadioWithNeck", "vllm.model_executor.models.nemotron_parse.logger" ], "n_typable": 168, "n_typed": 106, "n_any": 0, "n_untyped": 62, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 43, "n_method_overloads": 43, "n_method_params": 82, "n_classes": 13, "n_attrs": 43, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/nemotron_vl.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.models.nemotron_vl.SIGLIP_MEAN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.model_executor.models.nemotron_vl.calculate_nemotron_vl_targets", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.model_executor.models.nemotron_vl.get_nemotron_vl_target_ratios", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.model_executor.models.nemotron_vl.SIGLIP_STD", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.model_executor.models.nemotron_vl.build_siglip_transform", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.model_executor.models.nemotron_vl.LlamaNemotronVLForSequenceClassification", "methods": [ { "kind": "function", "name": "LlamaNemotronVLForSequenceClassification.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LlamaNemotronVLForSequenceClassification.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LlamaNemotronVLForSequenceClassification.weight_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaNemotronVLForSequenceClassification.score", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaNemotronVLForSequenceClassification.pooler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 5, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 3, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.nemotron_vl.build_transform", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.model_executor.models.nemotron_vl.NemotronVLProcessor", "methods": [ { "kind": "function", "name": "NemotronVLProcessor.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "NemotronVLProcessor._get_transform", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NemotronVLProcessor.get_num_image_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NemotronVLProcessor._images_to_pixel_values_lst", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "NemotronVLProcessor._replace_image_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NemotronVLProcessor._preprocess_image", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "NemotronVLProcessor.get_image_repl", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [ { "kind": "property", "name": "NemotronVLProcessor.image_token_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "NemotronVLProcessor.IMG_START", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NemotronVLProcessor.IMG_END", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NemotronVLProcessor.IMG_CONTEXT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NemotronVLProcessor.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronVLProcessor.tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronVLProcessor.image_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronVLProcessor.num_image_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronVLProcessor.image_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronVLProcessor.min_dynamic_patch", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronVLProcessor.max_dynamic_patch", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronVLProcessor.dynamic_image_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronVLProcessor.use_thumbnail", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 38, "n_typed": 29, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 21, "n_attrs": 12, "n_properties": 1 }, { "kind": "class", "name": "vllm.model_executor.models.nemotron_vl.NemotronVLProcessingInfo", "methods": [ { "kind": "function", "name": "NemotronVLProcessingInfo.get_hf_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NemotronVLProcessingInfo.get_image_processor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.nemotron_vl.image_to_pixel_values_nemotron_vl", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "class", "name": "vllm.model_executor.models.nemotron_vl.LlamaNemotronVLChatModel", "methods": [ { "kind": "function", "name": "LlamaNemotronVLChatModel.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LlamaNemotronVLChatModel.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LlamaNemotronVLChatModel._patch_quant_config", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LlamaNemotronVLChatModel._init_vision_model", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LlamaNemotronVLChatModel._init_mlp1", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LlamaNemotronVLChatModel.pixel_shuffle", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LlamaNemotronVLChatModel._call_vision_model", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlamaNemotronVLChatModel.extract_feature", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlamaNemotronVLChatModel._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlamaNemotronVLChatModel._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlamaNemotronVLChatModel._parse_and_validate_multimodal_inputs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlamaNemotronVLChatModel._set_visual_token_mask", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlamaNemotronVLChatModel.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlamaNemotronVLChatModel.embed_input_ids", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "LlamaNemotronVLChatModel.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "LlamaNemotronVLChatModel.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlamaNemotronVLChatModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlamaNemotronVLChatModel.get_mm_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LlamaNemotronVLChatModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaNemotronVLChatModel.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaNemotronVLChatModel.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaNemotronVLChatModel.num_image_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaNemotronVLChatModel.downsample_ratio", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaNemotronVLChatModel.ps_version", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaNemotronVLChatModel.img_context_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaNemotronVLChatModel.visual_token_mask", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaNemotronVLChatModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaNemotronVLChatModel.vision_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaNemotronVLChatModel.mlp1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaNemotronVLChatModel.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 62, "n_typed": 45, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 18, "n_method_overloads": 18, "n_method_params": 32, "n_attrs": 12, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.nemotron_vl.dynamic_preprocess_nemotron_vl", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.model_executor.models.nemotron_vl.LlamaNemotronVLEmbedProcessor", "methods": [ { "kind": "function", "name": "LlamaNemotronVLEmbedProcessor.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "LlamaNemotronVLEmbedProcessor._get_transform", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LlamaNemotronVLEmbedProcessor._replace_image_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LlamaNemotronVLEmbedProcessor.IMG_CONTEXT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 11, "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 8, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nemotron_vl.LlamaNemotronVLForEmbedding", "methods": [ { "kind": "function", "name": "LlamaNemotronVLForEmbedding.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LlamaNemotronVLForEmbedding._init_vision_model", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LlamaNemotronVLForEmbedding._init_mlp1", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlamaNemotronVLForEmbedding._call_vision_model", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LlamaNemotronVLForEmbedding.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LlamaNemotronVLForEmbedding.is_pooling_model", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LlamaNemotronVLForEmbedding.weight_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaNemotronVLForEmbedding.img_context_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LlamaNemotronVLForEmbedding.pooler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 12, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 8, "n_attrs": 4, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.nemotron_vl.find_closest_aspect_ratio", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "class", "name": "vllm.model_executor.models.nemotron_vl.LlamaNemotronVLEmbedProcessingInfo", "methods": [ { "kind": "function", "name": "LlamaNemotronVLEmbedProcessingInfo.get_hf_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.nemotron_vl", "names": [ "vllm.model_executor.models.nemotron_vl.LlamaNemotronVLChatModel", "vllm.model_executor.models.nemotron_vl.LlamaNemotronVLEmbedProcessingInfo", "vllm.model_executor.models.nemotron_vl.LlamaNemotronVLEmbedProcessor", "vllm.model_executor.models.nemotron_vl.LlamaNemotronVLForEmbedding", "vllm.model_executor.models.nemotron_vl.LlamaNemotronVLForSequenceClassification", "vllm.model_executor.models.nemotron_vl.NemotronVLProcessingInfo", "vllm.model_executor.models.nemotron_vl.NemotronVLProcessor", "vllm.model_executor.models.nemotron_vl.SIGLIP_MEAN", "vllm.model_executor.models.nemotron_vl.SIGLIP_STD", "vllm.model_executor.models.nemotron_vl.build_siglip_transform", "vllm.model_executor.models.nemotron_vl.build_transform", "vllm.model_executor.models.nemotron_vl.calculate_nemotron_vl_targets", "vllm.model_executor.models.nemotron_vl.dynamic_preprocess_nemotron_vl", "vllm.model_executor.models.nemotron_vl.find_closest_aspect_ratio", "vllm.model_executor.models.nemotron_vl.get_nemotron_vl_target_ratios", "vllm.model_executor.models.nemotron_vl.image_to_pixel_values_nemotron_vl" ], "n_typable": 172, "n_typed": 136, "n_any": 0, "n_untyped": 36, "n_functions": 7, "n_function_overloads": 7, "n_function_params": 24, "n_methods": 38, "n_method_overloads": 38, "n_method_params": 75, "n_classes": 7, "n_attrs": 34, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/nvlm_d.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.nvlm_d.NVLMDummyInputsBuilder", "methods": [ { "kind": "function", "name": "NVLMDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NVLMDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nvlm_d.NVLMProcessingInfo", "methods": [ { "kind": "function", "name": "NVLMProcessingInfo.get_hf_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nvlm_d.NVLMMultiModalProcessor", "methods": [ { "kind": "function", "name": "NVLMMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nvlm_d.NVLM_D_Model", "methods": [ { "kind": "function", "name": "NVLM_D_Model._init_mlp1", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NVLM_D_Model._init_vision_model", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.nvlm_d.IMG_PAD", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.nvlm_d.NVLMProcessor", "methods": [ { "kind": "function", "name": "NVLMProcessor.get_image_repl", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [ { "kind": "property", "name": "NVLMProcessor.image_token_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 1 } ], "type_ignores": [], "name": "vllm.model_executor.models.nvlm_d", "names": [ "vllm.model_executor.models.nvlm_d.IMG_PAD", "vllm.model_executor.models.nvlm_d.NVLMDummyInputsBuilder", "vllm.model_executor.models.nvlm_d.NVLMMultiModalProcessor", "vllm.model_executor.models.nvlm_d.NVLMProcessingInfo", "vllm.model_executor.models.nvlm_d.NVLMProcessor", "vllm.model_executor.models.nvlm_d.NVLM_D_Model" ], "n_typable": 23, "n_typed": 22, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 15, "n_classes": 5, "n_attrs": 1, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/olmo.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.olmo.OlmoAttention", "methods": [ { "kind": "function", "name": "OlmoAttention.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "OlmoAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OlmoAttention.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoAttention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoAttention.clip_qkv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 7, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 12, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.olmo.OlmoForCausalLM", "methods": [ { "kind": "function", "name": "OlmoForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OlmoForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OlmoForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "OlmoForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OlmoForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OlmoForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "OlmoForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 13, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.olmo.OlmoMLP", "methods": [ { "kind": "function", "name": "OlmoMLP.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "OlmoMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OlmoMLP.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoMLP.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoMLP.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoMLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 5, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.olmo.OlmoModel", "methods": [ { "kind": "function", "name": "OlmoModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OlmoModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OlmoModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "OlmoModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OlmoModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 11, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.olmo.OlmoDecoderLayer", "methods": [ { "kind": "function", "name": "OlmoDecoderLayer.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "OlmoDecoderLayer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OlmoDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 4, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.olmo", "names": [ "vllm.model_executor.models.olmo.OlmoAttention", "vllm.model_executor.models.olmo.OlmoDecoderLayer", "vllm.model_executor.models.olmo.OlmoForCausalLM", "vllm.model_executor.models.olmo.OlmoMLP", "vllm.model_executor.models.olmo.OlmoModel" ], "n_typable": 79, "n_typed": 43, "n_any": 0, "n_untyped": 36, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 33, "n_classes": 5, "n_attrs": 32, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/olmo2.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.olmo2.Olmo2ForCausalLM", "methods": [ { "kind": "function", "name": "Olmo2ForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Olmo2ForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Olmo2ForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Olmo2ForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Olmo2ForCausalLM.load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Olmo2ForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Olmo2ForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo2ForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo2ForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo2ForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo2ForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 12, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.olmo2.Olmo2Model", "methods": [ { "kind": "function", "name": "Olmo2Model.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Olmo2Model.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Olmo2Model.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Olmo2Model.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Olmo2Model.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo2Model.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo2Model.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo2Model.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 11, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.olmo2.Olmo2Attention", "methods": [ { "kind": "function", "name": "Olmo2Attention.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Olmo2Attention._apply_qk_norm", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Olmo2Attention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Olmo2Attention.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo2Attention.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo2Attention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo2Attention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo2Attention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo2Attention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo2Attention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo2Attention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo2Attention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo2Attention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo2Attention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo2Attention.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo2Attention.k_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo2Attention.q_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo2Attention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo2Attention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo2Attention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo2Attention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 27, "n_typed": 8, "n_any": 0, "n_untyped": 19, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_attrs": 18, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.olmo2.Olmo2MLP", "methods": [ { "kind": "function", "name": "Olmo2MLP.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Olmo2MLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Olmo2MLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo2MLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo2MLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 4, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.olmo2.Olmo2DecoderLayer", "methods": [ { "kind": "function", "name": "Olmo2DecoderLayer.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Olmo2DecoderLayer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Olmo2DecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo2DecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo2DecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo2DecoderLayer.post_feedforward_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 5, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 4, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.olmo2", "names": [ "vllm.model_executor.models.olmo2.Olmo2Attention", "vllm.model_executor.models.olmo2.Olmo2DecoderLayer", "vllm.model_executor.models.olmo2.Olmo2ForCausalLM", "vllm.model_executor.models.olmo2.Olmo2MLP", "vllm.model_executor.models.olmo2.Olmo2Model" ], "n_typable": 80, "n_typed": 40, "n_any": 0, "n_untyped": 40, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 16, "n_method_overloads": 16, "n_method_params": 30, "n_classes": 5, "n_attrs": 35, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/olmoe.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.olmoe.OlmoeDecoderLayer", "methods": [ { "kind": "function", "name": "OlmoeDecoderLayer.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OlmoeDecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OlmoeDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoeDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoeDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoeDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoeDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.olmoe.OlmoeMoE", "methods": [ { "kind": "function", "name": "OlmoeMoE.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "OlmoeMoE.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OlmoeMoE.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoeMoE.gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoeMoE.experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 10, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 9, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.olmoe.OlmoeModel", "methods": [ { "kind": "function", "name": "OlmoeModel.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "OlmoeModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OlmoeModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "OlmoeModel.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "OlmoeModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OlmoeModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoeModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoeModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoeModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoeModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 13, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.olmoe.OlmoeForCausalLM", "methods": [ { "kind": "function", "name": "OlmoeForCausalLM.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "OlmoeForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OlmoeForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "OlmoeForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OlmoeForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OlmoeForCausalLM.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OlmoeForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "OlmoeForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoeForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoeForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoeForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoeForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoeForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 15, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 10, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.olmoe.OlmoeAttention", "methods": [ { "kind": "function", "name": "OlmoeAttention.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OlmoeAttention._apply_qk_norm", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OlmoeAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OlmoeAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoeAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoeAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoeAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoeAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoeAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoeAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoeAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoeAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoeAttention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoeAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoeAttention.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoeAttention.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoeAttention.q_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoeAttention.k_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoeAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoeAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OlmoeAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 27, "n_typed": 9, "n_any": 0, "n_untyped": 18, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_attrs": 18, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.olmoe.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.models.olmoe", "names": [ "vllm.model_executor.models.olmoe.OlmoeAttention", "vllm.model_executor.models.olmoe.OlmoeDecoderLayer", "vllm.model_executor.models.olmoe.OlmoeForCausalLM", "vllm.model_executor.models.olmoe.OlmoeMoE", "vllm.model_executor.models.olmoe.OlmoeModel", "vllm.model_executor.models.olmoe.logger" ], "n_typable": 95, "n_typed": 54, "n_any": 0, "n_untyped": 41, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 18, "n_method_overloads": 18, "n_method_params": 39, "n_classes": 5, "n_attrs": 39, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/opencua.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.opencua.OpenCUAProcessor", "methods": [ { "kind": "function", "name": "OpenCUAProcessor.check_argument_for_proper_class", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OpenCUAProcessor.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "OpenCUAProcessor.__call__", "n_typed": 0, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OpenCUAProcessor.image_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 5, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.opencua.OpenCUAForConditionalGeneration", "methods": [ { "kind": "function", "name": "OpenCUAForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OpenCUAForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OpenCUAForConditionalGeneration.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "OpenCUAForConditionalGeneration.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenCUAForConditionalGeneration.supports_encoder_tp_data", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "OpenCUAForConditionalGeneration.use_data_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenCUAForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenCUAForConditionalGeneration.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenCUAForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenCUAForConditionalGeneration.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenCUAForConditionalGeneration.is_multimodal_pruning_enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenCUAForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenCUAForConditionalGeneration.visual", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenCUAForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 5, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 12, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.opencua.OpenCUAProcessingInfo", "methods": [ { "kind": "function", "name": "OpenCUAProcessingInfo.get_data_parser", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "OpenCUAProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "OpenCUAProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "OpenCUAProcessingInfo.get_hf_processor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 5, "n_typed": 2, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.opencua.OpenCUADummyInputsBuilder", "methods": [ { "kind": "function", "name": "OpenCUADummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.opencua.OpenCUAMultiModalProcessor", "methods": [ { "kind": "function", "name": "OpenCUAMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OpenCUAMultiModalProcessor._hf_processor_applies_updates", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "OpenCUAMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.opencua", "names": [ "vllm.model_executor.models.opencua.OpenCUADummyInputsBuilder", "vllm.model_executor.models.opencua.OpenCUAForConditionalGeneration", "vllm.model_executor.models.opencua.OpenCUAMultiModalProcessor", "vllm.model_executor.models.opencua.OpenCUAProcessingInfo", "vllm.model_executor.models.opencua.OpenCUAProcessor" ], "n_typable": 48, "n_typed": 26, "n_any": 0, "n_untyped": 22, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 24, "n_classes": 5, "n_attrs": 13, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/openpangu.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.openpangu.OpenPanguMLAAttention", "methods": [ { "kind": "function", "name": "OpenPanguMLAAttention.__init__", "n_typed": 13, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 }, { "kind": "function", "name": "OpenPanguMLAAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OpenPanguMLAAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMLAAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMLAAttention.qk_nope_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMLAAttention.qk_rope_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMLAAttention.qk_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMLAAttention.v_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMLAAttention.q_lora_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMLAAttention.kv_lora_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMLAAttention.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMLAAttention.num_local_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMLAAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMLAAttention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMLAAttention.prefix", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMLAAttention.kv_a_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMLAAttention.kv_b_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMLAAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMLAAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMLAAttention.mla_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMLAAttention.fused_qkv_a_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMLAAttention.q_a_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMLAAttention.q_b_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMLAAttention.q_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMLAAttention.kv_a_proj_with_mqa", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 39, "n_typed": 16, "n_any": 0, "n_untyped": 23, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 14, "n_attrs": 23, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.openpangu.PanguProMoEV2ForCausalLM", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.openpangu.OpenPanguEmbeddedAttention", "methods": [ { "kind": "function", "name": "OpenPanguEmbeddedAttention.__init__", "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "OpenPanguEmbeddedAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OpenPanguEmbeddedAttention._init_rotary_emb", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OpenPanguEmbeddedAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguEmbeddedAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguEmbeddedAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguEmbeddedAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguEmbeddedAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguEmbeddedAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguEmbeddedAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguEmbeddedAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguEmbeddedAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguEmbeddedAttention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguEmbeddedAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguEmbeddedAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguEmbeddedAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 31, "n_typed": 18, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 15, "n_attrs": 13, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.openpangu.OpenPanguMLP", "methods": [ { "kind": "function", "name": "OpenPanguMLP.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "OpenPanguMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OpenPanguMLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 10, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 9, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.openpangu.OpenPanguModelBase", "methods": [ { "kind": "function", "name": "OpenPanguModelBase.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OpenPanguModelBase.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenPanguModelBase.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "OpenPanguModelBase.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenPanguModelBase.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OpenPanguModelBase.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "OpenPanguModelBase.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguModelBase.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguModelBase.fuse_qkv_a_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguModelBase.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguModelBase.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguModelBase.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguModelBase.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 13, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.openpangu.OpenPanguEmbeddedModel", "methods": [ { "kind": "function", "name": "OpenPanguEmbeddedModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.openpangu.PanguEmbeddedForCausalLM", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.openpangu.OpenPanguSinkAttention", "methods": [ { "kind": "function", "name": "OpenPanguSinkAttention.__init__", "n_typed": 13, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 }, { "kind": "function", "name": "OpenPanguSinkAttention.weight_loader", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OpenPanguSinkAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OpenPanguSinkAttention._init_rotary_emb", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "OpenPanguSinkAttention.post_weight_load", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OpenPanguSinkAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguSinkAttention.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguSinkAttention.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguSinkAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguSinkAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguSinkAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguSinkAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguSinkAttention.qk_nope_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguSinkAttention.qk_rope_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguSinkAttention.v_channels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguSinkAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguSinkAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguSinkAttention.k_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguSinkAttention.v_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguSinkAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguSinkAttention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguSinkAttention.param_sink_number", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguSinkAttention.param_sink_with_value", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguSinkAttention.param_sink_scalar", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguSinkAttention.param_sink_of_head_num", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguSinkAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguSinkAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguSinkAttention.k_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguSinkAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguSinkAttention.param_sink_key", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguSinkAttention.param_sink_value", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 50, "n_typed": 23, "n_any": 0, "n_untyped": 27, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 19, "n_attrs": 26, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.openpangu.OpenPanguDecoderLayer", "methods": [ { "kind": "function", "name": "OpenPanguDecoderLayer.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "OpenPanguDecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OpenPanguDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguDecoderLayer.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguDecoderLayer.use_mla", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguDecoderLayer.use_sink_attention", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguDecoderLayer.routed_scaling_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguDecoderLayer.num_hidden_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguDecoderLayer.first_k_dense_replace", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguDecoderLayer.tp_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguDecoderLayer.sandwich_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguDecoderLayer.pre_mlp_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguDecoderLayer.post_mlp_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 23, "n_typed": 8, "n_any": 0, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 15, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.openpangu.PanguUltraMoEForCausalLM", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.openpangu.check_ffn_act_fn", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.model_executor.models.openpangu.OpenPanguMoE", "methods": [ { "kind": "function", "name": "OpenPanguMoE.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "OpenPanguMoE.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OpenPanguMoE.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMoE.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMoE.routed_scaling_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMoE.ep_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMoE.ep_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMoE.ep_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMoE.n_routed_experts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMoE.n_shared_experts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMoE.is_sequence_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMoE.gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMoE.enable_eplb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMoE.n_redundant_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMoE.n_logical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMoE.n_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMoE.n_local_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMoE.physical_expert_start", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMoE.physical_expert_end", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMoE.experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMoE.shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 26, "n_typed": 8, "n_any": 0, "n_untyped": 18, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 19, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.openpangu.OpenPanguModel", "methods": [ { "kind": "function", "name": "OpenPanguModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OpenPanguModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenPanguModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "OpenPanguModel.load_attn_mlp_weight", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "OpenPanguModel.load_expert_weight", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "OpenPanguModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenPanguModel.post_weight_load", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OpenPanguModel.fall_back_to_pt_during_load", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "OpenPanguModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguModel.num_redundant_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 32, "n_typed": 25, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 19, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.openpangu.OpenPanguMoEModel", "methods": [ { "kind": "function", "name": "OpenPanguMoEModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OpenPanguMoEModel.update_physical_experts_metadata", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OpenPanguMoEModel.expert_weights", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMoEModel.num_moe_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMoEModel.num_expert_groups", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMoEModel.moe_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMoEModel.num_logical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMoEModel.num_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMoEModel.num_local_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMoEModel.n_routed_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMoEModel.n_shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMoEModel.num_redundant_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 5, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 10, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.openpangu", "names": [ "vllm.model_executor.models.openpangu.OpenPanguDecoderLayer", "vllm.model_executor.models.openpangu.OpenPanguEmbeddedAttention", "vllm.model_executor.models.openpangu.OpenPanguEmbeddedModel", "vllm.model_executor.models.openpangu.OpenPanguMLAAttention", "vllm.model_executor.models.openpangu.OpenPanguMLP", "vllm.model_executor.models.openpangu.OpenPanguMoE", "vllm.model_executor.models.openpangu.OpenPanguMoEModel", "vllm.model_executor.models.openpangu.OpenPanguModel", "vllm.model_executor.models.openpangu.OpenPanguModelBase", "vllm.model_executor.models.openpangu.OpenPanguSinkAttention", "vllm.model_executor.models.openpangu.PanguEmbeddedForCausalLM", "vllm.model_executor.models.openpangu.PanguProMoEV2ForCausalLM", "vllm.model_executor.models.openpangu.PanguUltraMoEForCausalLM", "vllm.model_executor.models.openpangu.check_ffn_act_fn" ], "n_typable": 257, "n_typed": 129, "n_any": 0, "n_untyped": 128, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 31, "n_method_overloads": 31, "n_method_params": 102, "n_classes": 13, "n_attrs": 124, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/openpangu_mtp.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.openpangu_mtp.OpenPanguMultiTokenPredictorLayer", "methods": [ { "kind": "function", "name": "OpenPanguMultiTokenPredictorLayer.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OpenPanguMultiTokenPredictorLayer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMultiTokenPredictorLayer.enorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMultiTokenPredictorLayer.hnorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMultiTokenPredictorLayer.eh_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMultiTokenPredictorLayer.shared_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMultiTokenPredictorLayer.mtp_block", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 3, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.openpangu_mtp.OpenPanguMultiTokenPredictor", "methods": [ { "kind": "function", "name": "OpenPanguMultiTokenPredictor.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OpenPanguMultiTokenPredictor.mtp_start_layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMultiTokenPredictor.num_mtp_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMultiTokenPredictor.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMultiTokenPredictor.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMultiTokenPredictor.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 2, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.openpangu_mtp.OpenPanguMTP", "methods": [ { "kind": "function", "name": "OpenPanguMTP.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OpenPanguMTP.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenPanguMTP.forward", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "OpenPanguMTP.compute_logits", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OpenPanguMTP.get_spec_layer", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenPanguMTP.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenPanguMTP._rewrite_spec_layer_name", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OpenPanguMTP.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguMTP.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 24, "n_typed": 19, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 15, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.openpangu_mtp", "names": [ "vllm.model_executor.models.openpangu_mtp.OpenPanguMTP", "vllm.model_executor.models.openpangu_mtp.OpenPanguMultiTokenPredictor", "vllm.model_executor.models.openpangu_mtp.OpenPanguMultiTokenPredictorLayer" ], "n_typable": 41, "n_typed": 24, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 19, "n_classes": 3, "n_attrs": 13, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/openpangu_vl.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.openpangu_vl.OpenPanguVLVideoPixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "OpenPanguVLVideoPixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVLVideoPixelInputs.pixel_values_videos", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVLVideoPixelInputs.video_grid_thw", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.openpangu_vl.ProjectionSingle", "methods": [ { "kind": "function", "name": "ProjectionSingle.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ProjectionSingle.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ProjectionSingle.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ProjectionSingle.fc1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 2, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.openpangu_vl.OpenPanguVLDummyInputsBuilder", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.openpangu_vl.OpenPanguVisionAttention", "methods": [ { "kind": "function", "name": "OpenPanguVisionAttention.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "OpenPanguVisionAttention.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OpenPanguVisionAttention.hidden_size_per_attention_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionAttention.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionAttention.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionAttention.num_attention_heads_per_partition", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionAttention.qkv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionAttention.proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionAttention.apply_rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 11, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 9, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.openpangu_vl.OpenPanguVLForConditionalGeneration", "methods": [ { "kind": "function", "name": "OpenPanguVLForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OpenPanguVLForConditionalGeneration._parse_preprocess_params", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenPanguVLForConditionalGeneration._maybe_ignore_quant_config", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenPanguVLForConditionalGeneration._validate_and_reshape_mm_tensor", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OpenPanguVLForConditionalGeneration._parse_and_validate_image_input", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenPanguVLForConditionalGeneration._parse_and_validate_video_input", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenPanguVLForConditionalGeneration._parse_and_validate_multimodal_inputs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenPanguVLForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenPanguVLForConditionalGeneration.get_input_embeddings", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OpenPanguVLForConditionalGeneration._process_image_input", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenPanguVLForConditionalGeneration._process_video_input", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenPanguVLForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "OpenPanguVLForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OpenPanguVLForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenPanguVLForConditionalGeneration.get_mm_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "OpenPanguVLForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OpenPanguVLForConditionalGeneration.iter_mm_grid_thw", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenPanguVLForConditionalGeneration.get_mrope_input_positions", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OpenPanguVLForConditionalGeneration.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVLForConditionalGeneration.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "OpenPanguVLForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVLForConditionalGeneration.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVLForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVLForConditionalGeneration.visual", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVLForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 51, "n_typed": 35, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 18, "n_method_overloads": 18, "n_method_params": 27, "n_attrs": 7, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.openpangu_vl.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.openpangu_vl.OpenPanguVLImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "OpenPanguVLImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVLImagePixelInputs.pixel_values", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVLImagePixelInputs.image_grid_thw", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.openpangu_vl.normalize", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.models.openpangu_vl.rescale", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.models.openpangu_vl.OpenPanguVisionPatchEmbed", "methods": [ { "kind": "function", "name": "OpenPanguVisionPatchEmbed.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "OpenPanguVisionPatchEmbed.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OpenPanguVisionPatchEmbed.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionPatchEmbed.temporal_patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionPatchEmbed.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionPatchEmbed.input_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionPatchEmbed.proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.openpangu_vl.OpenPanguVisionRotaryEmbedding", "methods": [ { "kind": "function", "name": "OpenPanguVisionRotaryEmbedding.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OpenPanguVisionRotaryEmbedding.update_freqs_cache", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenPanguVisionRotaryEmbedding.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OpenPanguVisionRotaryEmbedding.inv_freq", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.openpangu_vl.OpenPanguVLProcessingInfo", "methods": [ { "kind": "function", "name": "OpenPanguVLProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "OpenPanguVLProcessingInfo.get_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.openpangu_vl.rescale_and_normalize", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "class", "name": "vllm.model_executor.models.openpangu_vl.OpenPanguVisionPatchMerger", "methods": [ { "kind": "function", "name": "OpenPanguVisionPatchMerger.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "OpenPanguVisionPatchMerger.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OpenPanguVisionPatchMerger.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionPatchMerger.ln_q", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionPatchMerger.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 9, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.openpangu_vl.OpenPanguVLImageEmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "OpenPanguVLImageEmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVLImageEmbeddingInputs.image_embeds", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVLImageEmbeddingInputs.image_grid_thw", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.openpangu_vl.OpenPanguVLVideoEmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "OpenPanguVLVideoEmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVLVideoEmbeddingInputs.video_embeds", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVLVideoEmbeddingInputs.video_grid_thw", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.openpangu_vl.OpenPanguVisionBlock", "methods": [ { "kind": "function", "name": "OpenPanguVisionBlock.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "OpenPanguVisionBlock.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OpenPanguVisionBlock.norm1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionBlock.norm2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionBlock.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionBlock.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 13, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 12, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.openpangu_vl.OpenPanguVLMultiModalProcessor", "methods": [ { "kind": "function", "name": "OpenPanguVLMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.openpangu_vl.OpenPanguVisionTransformer", "methods": [ { "kind": "function", "name": "OpenPanguVisionTransformer.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "OpenPanguVisionTransformer.cal_cos_sin", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenPanguVisionTransformer.rot_pos_emb", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenPanguVisionTransformer.get_window_index", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenPanguVisionTransformer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OpenPanguVisionTransformer.load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "OpenPanguVisionTransformer.dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "OpenPanguVisionTransformer.device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "OpenPanguVisionTransformer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionTransformer.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionTransformer.window_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionTransformer.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionTransformer.spatial_merge_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionTransformer.fullatt_block_indexes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionTransformer.spatial_merge_unit", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionTransformer.interleaved", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionTransformer.out_hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionTransformer.hidden_act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionTransformer.attn_backend", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionTransformer.rotary_pos_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionTransformer.patch_embed", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionTransformer.blocks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionTransformer.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionTransformer.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionTransformer.hidden_size_per_attention_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionTransformer.select_layer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionTransformer.select_index", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionTransformer.take_indices", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionTransformer.final_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionTransformer.merger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionTransformer.vision_projection", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 44, "n_typed": 12, "n_any": 0, "n_untyped": 32, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 13, "n_attrs": 23, "n_properties": 2 }, { "kind": "class", "name": "vllm.model_executor.models.openpangu_vl.OpenPanguVisionMLP", "methods": [ { "kind": "function", "name": "OpenPanguVisionMLP.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "OpenPanguVisionMLP.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OpenPanguVisionMLP.hidden_act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionMLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OpenPanguVisionMLP.up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 7, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 5, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.openpangu_vl", "names": [ "vllm.model_executor.models.openpangu_vl.OpenPanguVLDummyInputsBuilder", "vllm.model_executor.models.openpangu_vl.OpenPanguVLForConditionalGeneration", "vllm.model_executor.models.openpangu_vl.OpenPanguVLImageEmbeddingInputs", "vllm.model_executor.models.openpangu_vl.OpenPanguVLImagePixelInputs", "vllm.model_executor.models.openpangu_vl.OpenPanguVLMultiModalProcessor", "vllm.model_executor.models.openpangu_vl.OpenPanguVLProcessingInfo", "vllm.model_executor.models.openpangu_vl.OpenPanguVLVideoEmbeddingInputs", "vllm.model_executor.models.openpangu_vl.OpenPanguVLVideoPixelInputs", "vllm.model_executor.models.openpangu_vl.OpenPanguVisionAttention", "vllm.model_executor.models.openpangu_vl.OpenPanguVisionBlock", "vllm.model_executor.models.openpangu_vl.OpenPanguVisionMLP", "vllm.model_executor.models.openpangu_vl.OpenPanguVisionPatchEmbed", "vllm.model_executor.models.openpangu_vl.OpenPanguVisionPatchMerger", "vllm.model_executor.models.openpangu_vl.OpenPanguVisionRotaryEmbedding", "vllm.model_executor.models.openpangu_vl.OpenPanguVisionTransformer", "vllm.model_executor.models.openpangu_vl.ProjectionSingle", "vllm.model_executor.models.openpangu_vl.logger", "vllm.model_executor.models.openpangu_vl.normalize", "vllm.model_executor.models.openpangu_vl.rescale", "vllm.model_executor.models.openpangu_vl.rescale_and_normalize" ], "n_typable": 225, "n_typed": 132, "n_any": 0, "n_untyped": 93, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 12, "n_methods": 42, "n_method_overloads": 42, "n_method_params": 96, "n_classes": 16, "n_attrs": 71, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/opt.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.opt.OPTDecoderLayer", "methods": [ { "kind": "function", "name": "OPTDecoderLayer.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "OPTDecoderLayer.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OPTDecoderLayer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OPTDecoderLayer.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OPTDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OPTDecoderLayer.do_layer_norm_before", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OPTDecoderLayer.self_attn_layer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OPTDecoderLayer.fc1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OPTDecoderLayer.activation_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OPTDecoderLayer.fc2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OPTDecoderLayer.final_layer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 6, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.opt.OPTModel", "methods": [ { "kind": "function", "name": "OPTModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OPTModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OPTModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "OPTModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OPTModel.decoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OPTModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 11, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.opt.OPTLearnedPositionalEmbedding", "methods": [ { "kind": "function", "name": "OPTLearnedPositionalEmbedding.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OPTLearnedPositionalEmbedding.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OPTLearnedPositionalEmbedding.offset", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 6, "n_typed": 3, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.opt.OPTDecoder", "methods": [ { "kind": "function", "name": "OPTDecoder.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "OPTDecoder.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OPTDecoder.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OPTDecoder.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OPTDecoder.max_target_positions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OPTDecoder.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OPTDecoder.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OPTDecoder.embed_positions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OPTDecoder.project_out", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OPTDecoder.project_in", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OPTDecoder.final_layer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 11, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.opt.OPTAttention", "methods": [ { "kind": "function", "name": "OPTAttention.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "OPTAttention.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OPTAttention.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OPTAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OPTAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OPTAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OPTAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OPTAttention.out_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OPTAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 9, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.opt.OPTForCausalLM", "methods": [ { "kind": "function", "name": "OPTForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OPTForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OPTForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "OPTForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OPTForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OPTForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "OPTForCausalLM.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OPTForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OPTForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OPTForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OPTForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OPTForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OPTForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 13, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 8, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.opt", "names": [ "vllm.model_executor.models.opt.OPTAttention", "vllm.model_executor.models.opt.OPTDecoder", "vllm.model_executor.models.opt.OPTDecoderLayer", "vllm.model_executor.models.opt.OPTForCausalLM", "vllm.model_executor.models.opt.OPTLearnedPositionalEmbedding", "vllm.model_executor.models.opt.OPTModel" ], "n_typable": 93, "n_typed": 53, "n_any": 0, "n_untyped": 40, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 18, "n_method_overloads": 18, "n_method_params": 41, "n_classes": 6, "n_attrs": 35, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/orion.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.orion.OrionModel", "methods": [ { "kind": "function", "name": "OrionModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OrionModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OrionModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "OrionModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OrionModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OrionModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OrionModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OrionModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OrionModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 11, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.orion.OrionMLP", "methods": [ { "kind": "function", "name": "OrionMLP.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "OrionMLP.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OrionMLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OrionMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OrionMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 6, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.orion.OrionAttention", "methods": [ { "kind": "function", "name": "OrionAttention.__init__", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "OrionAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OrionAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OrionAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OrionAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OrionAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OrionAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OrionAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OrionAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OrionAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OrionAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OrionAttention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OrionAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OrionAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OrionAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OrionAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 26, "n_typed": 12, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 10, "n_attrs": 14, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.orion.OrionDecoderLayer", "methods": [ { "kind": "function", "name": "OrionDecoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "OrionDecoderLayer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OrionDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OrionDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OrionDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OrionDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OrionDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 8, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.orion.OrionForCausalLM", "methods": [ { "kind": "function", "name": "OrionForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OrionForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OrionForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "OrionForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OrionForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OrionForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OrionForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OrionForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OrionForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OrionForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OrionForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 13, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.orion", "names": [ "vllm.model_executor.models.orion.OrionAttention", "vllm.model_executor.models.orion.OrionDecoderLayer", "vllm.model_executor.models.orion.OrionForCausalLM", "vllm.model_executor.models.orion.OrionMLP", "vllm.model_executor.models.orion.OrionModel" ], "n_typable": 87, "n_typed": 50, "n_any": 0, "n_untyped": 37, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 39, "n_classes": 5, "n_attrs": 33, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/ouro.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.ouro.OuroModel", "methods": [ { "kind": "function", "name": "OuroModel.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "OuroModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OuroModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "OuroModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OuroModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OuroModel.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OuroModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OuroModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OuroModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OuroModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OuroModel.early_exit_gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OuroModel.total_ut_steps", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 12, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 9, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ouro.OuroMLP", "methods": [ { "kind": "function", "name": "OuroMLP.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "OuroMLP.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OuroMLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OuroMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OuroMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 6, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ouro.OuroForCausalLM", "methods": [ { "kind": "function", "name": "OuroForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OuroForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OuroForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "OuroForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OuroForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OuroForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "OuroForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OuroForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OuroForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OuroForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OuroForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OuroForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 13, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ouro.OuroAttention", "methods": [ { "kind": "function", "name": "OuroAttention.__init__", "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "OuroAttention.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OuroAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OuroAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OuroAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OuroAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OuroAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OuroAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OuroAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OuroAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OuroAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OuroAttention.dual_chunk_attention_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OuroAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OuroAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OuroAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OuroAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 29, "n_typed": 15, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 13, "n_attrs": 14, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ouro.OuroDecoderLayer", "methods": [ { "kind": "function", "name": "OuroDecoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "OuroDecoderLayer.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OuroDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OuroDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OuroDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OuroDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OuroDecoderLayer.input_layernorm_2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OuroDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OuroDecoderLayer.post_attention_layernorm_2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 10, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 7, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.ouro", "names": [ "vllm.model_executor.models.ouro.OuroAttention", "vllm.model_executor.models.ouro.OuroDecoderLayer", "vllm.model_executor.models.ouro.OuroForCausalLM", "vllm.model_executor.models.ouro.OuroMLP", "vllm.model_executor.models.ouro.OuroModel" ], "n_typable": 98, "n_typed": 56, "n_any": 0, "n_untyped": 42, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 45, "n_classes": 5, "n_attrs": 39, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/ovis.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.models.ovis.st_argmax", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.models.ovis.VisualTokenizer", "methods": [ { "kind": "function", "name": "VisualTokenizer.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "VisualTokenizer._init_backbone", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "VisualTokenizer.tokenize", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "VisualTokenizer.encode", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "VisualTokenizer.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "VisualTokenizer.dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "VisualTokenizer.device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "VisualTokenizer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VisualTokenizer.backbone", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VisualTokenizer.head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 15, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 3, "n_properties": 2 }, { "kind": "attr", "name": "vllm.model_executor.models.ovis.IMAGE_PAD_TOKEN_ID_MAP", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.ovis.IMAGE_INDICATOR_IDS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.ovis.IMAGE_PAD_TOKEN_MAP", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ovis.Ovis", "methods": [ { "kind": "function", "name": "Ovis.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Ovis.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Ovis._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Ovis._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Ovis.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Ovis.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Ovis.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Ovis.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Ovis.config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Ovis.image_pad_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ovis.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ovis.llm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ovis.visual_tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ovis.vte", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 28, "n_typed": 22, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 14, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ovis.OvisDummyInputsBuilder", "methods": [ { "kind": "function", "name": "OvisDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OvisDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ovis.OvisImagePatchInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "OvisImagePatchInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "OvisImagePatchInputs.flat_data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "OvisImagePatchInputs.indicator_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "OvisImagePatchInputs.patches_per_image", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ovis.OvisProcessingInfo", "methods": [ { "kind": "function", "name": "OvisProcessingInfo.get_hf_processor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OvisProcessingInfo.get_default_tok_params", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "OvisProcessingInfo.get_image_segment_len", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "OvisProcessingInfo.get_image_pad_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "OvisProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "OvisProcessingInfo.get_image_size_with_most_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ovis.OvisMultiModalProcessor", "methods": [ { "kind": "function", "name": "OvisMultiModalProcessor.image_indicators_to_visual_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OvisMultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "OvisMultiModalProcessor._apply_hf_processor_tokens_only", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OvisMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OvisMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 16, "n_typed": 16, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 11, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.ovis.IMAGE_TOKEN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ovis.VisualEmbedding", "methods": [ { "kind": "function", "name": "VisualEmbedding.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VisualEmbedding.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "VisualEmbedding.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "VisualEmbedding.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [], "n_typable": 7, "n_typed": 2, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 0, "n_properties": 2 } ], "type_ignores": [], "name": "vllm.model_executor.models.ovis", "names": [ "vllm.model_executor.models.ovis.IMAGE_INDICATOR_IDS", "vllm.model_executor.models.ovis.IMAGE_PAD_TOKEN_ID_MAP", "vllm.model_executor.models.ovis.IMAGE_PAD_TOKEN_MAP", "vllm.model_executor.models.ovis.IMAGE_TOKEN", "vllm.model_executor.models.ovis.Ovis", "vllm.model_executor.models.ovis.OvisDummyInputsBuilder", "vllm.model_executor.models.ovis.OvisImagePatchInputs", "vllm.model_executor.models.ovis.OvisMultiModalProcessor", "vllm.model_executor.models.ovis.OvisProcessingInfo", "vllm.model_executor.models.ovis.VisualEmbedding", "vllm.model_executor.models.ovis.VisualTokenizer", "vllm.model_executor.models.ovis.st_argmax" ], "n_typable": 90, "n_typed": 73, "n_any": 0, "n_untyped": 17, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 28, "n_method_overloads": 28, "n_method_params": 42, "n_classes": 7, "n_attrs": 17, "n_properties": 4, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/ovis2_5.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.ovis2_5.Ovis2_5", "methods": [ { "kind": "function", "name": "Ovis2_5.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Ovis2_5.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Ovis2_5._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Ovis2_5._parse_and_validate_video_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Ovis2_5._process_visual_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Ovis2_5._parse_and_validate_multimodal_inputs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Ovis2_5.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Ovis2_5.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Ovis2_5.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Ovis2_5.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Ovis2_5.config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Ovis2_5.image_pad_token_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Ovis2_5.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ovis2_5.llm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ovis2_5.visual_tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ovis2_5.vte", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 32, "n_typed": 27, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 16, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ovis2_5.VisualTokenizer", "methods": [ { "kind": "function", "name": "VisualTokenizer.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "VisualTokenizer._init_backbone", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "VisualTokenizer.tokenize", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "VisualTokenizer.encode", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VisualTokenizer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [ { "kind": "property", "name": "VisualTokenizer.dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "VisualTokenizer.device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "VisualTokenizer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VisualTokenizer.vit", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VisualTokenizer.head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 17, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 12, "n_attrs": 3, "n_properties": 2 }, { "kind": "class", "name": "vllm.model_executor.models.ovis2_5.Ovis2_5VideoPatchInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Ovis2_5VideoPatchInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Ovis2_5VideoPatchInputs.flat_data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Ovis2_5VideoPatchInputs.indicator_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Ovis2_5VideoPatchInputs.patches_per_item", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Ovis2_5VideoPatchInputs.grids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 5, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.ovis2_5.IMAGE_PAD_TOKEN_ID", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ovis2_5.Ovis2_5ProcessingInfo", "methods": [ { "kind": "function", "name": "Ovis2_5ProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Ovis2_5ProcessingInfo.get_hf_processor", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Ovis2_5ProcessingInfo.get_default_tok_params", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Ovis2_5ProcessingInfo.get_image_processor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Ovis2_5ProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Ovis2_5ProcessingInfo.get_image_size_with_most_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Ovis2_5ProcessingInfo.get_num_image_tokens", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Ovis2_5ProcessingInfo.get_max_image_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Ovis2_5ProcessingInfo._get_max_video_frames", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Ovis2_5ProcessingInfo.get_num_frames_with_most_features", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Ovis2_5ProcessingInfo.get_num_video_tokens", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Ovis2_5ProcessingInfo.get_max_video_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 24, "n_typed": 21, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 12, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.ovis2_5.VIDEO_TOKEN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.ovis2_5.IMAGE_TOKEN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ovis2_5.Ovis2_5ImagePatchInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Ovis2_5ImagePatchInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Ovis2_5ImagePatchInputs.flat_data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Ovis2_5ImagePatchInputs.indicator_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Ovis2_5ImagePatchInputs.patches_per_item", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Ovis2_5ImagePatchInputs.grids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ovis2_5.Ovis2_5DummyInputsBuilder", "methods": [ { "kind": "function", "name": "Ovis2_5DummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Ovis2_5DummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.ovis2_5.INDICATOR_IDS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ovis2_5.Ovis2_5MultiModalProcessor", "methods": [ { "kind": "function", "name": "Ovis2_5MultiModalProcessor.visual_indicators_to_visual_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Ovis2_5MultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Ovis2_5MultiModalProcessor._apply_hf_processor_tokens_only", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Ovis2_5MultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Ovis2_5MultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 16, "n_typed": 16, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 11, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.ovis2_5", "names": [ "vllm.model_executor.models.ovis2_5.IMAGE_PAD_TOKEN_ID", "vllm.model_executor.models.ovis2_5.IMAGE_TOKEN", "vllm.model_executor.models.ovis2_5.INDICATOR_IDS", "vllm.model_executor.models.ovis2_5.Ovis2_5", "vllm.model_executor.models.ovis2_5.Ovis2_5DummyInputsBuilder", "vllm.model_executor.models.ovis2_5.Ovis2_5ImagePatchInputs", "vllm.model_executor.models.ovis2_5.Ovis2_5MultiModalProcessor", "vllm.model_executor.models.ovis2_5.Ovis2_5ProcessingInfo", "vllm.model_executor.models.ovis2_5.Ovis2_5VideoPatchInputs", "vllm.model_executor.models.ovis2_5.VIDEO_TOKEN", "vllm.model_executor.models.ovis2_5.VisualTokenizer" ], "n_typable": 110, "n_typed": 97, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 34, "n_method_overloads": 34, "n_method_params": 55, "n_classes": 7, "n_attrs": 23, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/paddleocr_vl.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.paddleocr_vl.PaddleOCRVLDummyInputsBuilder", "methods": [ { "kind": "function", "name": "PaddleOCRVLDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PaddleOCRVLDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.paddleocr_vl.SiglipAttention", "methods": [ { "kind": "function", "name": "SiglipAttention.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "SiglipAttention.split_qkv", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SiglipAttention.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SiglipAttention.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipAttention.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipAttention.hidden_size_per_attention_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipAttention.num_attention_heads_per_partition", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipAttention.out_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipAttention.apply_rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 13, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 10, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.paddleocr_vl.PaddleOCRVLForConditionalGeneration", "methods": [ { "kind": "function", "name": "PaddleOCRVLForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PaddleOCRVLForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PaddleOCRVLForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PaddleOCRVLForConditionalGeneration.get_mrope_input_positions", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PaddleOCRVLForConditionalGeneration._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PaddleOCRVLForConditionalGeneration.forward", "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "PaddleOCRVLForConditionalGeneration.encode_image", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PaddleOCRVLForConditionalGeneration._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PaddleOCRVLForConditionalGeneration.embed_multimodal", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PaddleOCRVLForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PaddleOCRVLForConditionalGeneration.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PaddleOCRVLForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PaddleOCRVLForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PaddleOCRVLForConditionalGeneration.visual", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PaddleOCRVLForConditionalGeneration.mlp_AR", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PaddleOCRVLForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 34, "n_typed": 24, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 18, "n_attrs": 6, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.paddleocr_vl.smart_resize", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "class", "name": "vllm.model_executor.models.paddleocr_vl.PaddleOCRVLProcessingInfo", "methods": [ { "kind": "function", "name": "PaddleOCRVLProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PaddleOCRVLProcessingInfo.get_hf_processor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PaddleOCRVLProcessingInfo.get_image_processor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PaddleOCRVLProcessingInfo.get_supported_mm_limits", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PaddleOCRVLProcessingInfo.get_num_image_tokens", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "PaddleOCRVLProcessingInfo.get_image_size_with_most_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 8, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 6, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.paddleocr_vl.SiglipVisionEmbeddings", "methods": [ { "kind": "function", "name": "SiglipVisionEmbeddings.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SiglipVisionEmbeddings.interpolate_pos_encoding", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "SiglipVisionEmbeddings.fetch_position_embedding_lfu_cache", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "SiglipVisionEmbeddings.forward", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SiglipVisionEmbeddings.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipVisionEmbeddings.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipVisionEmbeddings.image_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipVisionEmbeddings.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipVisionEmbeddings.patch_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipVisionEmbeddings.num_patches", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipVisionEmbeddings.num_positions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipVisionEmbeddings.cache_position_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipVisionEmbeddings.cache_position_count", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipVisionEmbeddings.position_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipVisionEmbeddings.packing_position_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 28, "n_typed": 14, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 13, "n_attrs": 11, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.paddleocr_vl.SiglipEncoder", "methods": [ { "kind": "function", "name": "SiglipEncoder.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SiglipEncoder.flatten_list", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SiglipEncoder.forward", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SiglipEncoder.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipEncoder.attn_backend", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipEncoder.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipEncoder.rotary_pos_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 8, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 4, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.paddleocr_vl.all_gather_interleave", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.model_executor.models.paddleocr_vl.PaddleOCRImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "PaddleOCRImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PaddleOCRImagePixelInputs.pixel_values", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PaddleOCRImagePixelInputs.image_grid_thw", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.paddleocr_vl.SigLIPRotaryEmbedding", "methods": [ { "kind": "function", "name": "SigLIPRotaryEmbedding.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SigLIPRotaryEmbedding.rope_init", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SigLIPRotaryEmbedding.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SigLIPRotaryEmbedding.dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SigLIPRotaryEmbedding.theta", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 5, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.paddleocr_vl.Projector", "methods": [ { "kind": "function", "name": "Projector.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Projector.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Projector.text_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Projector.vision_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Projector.merge_kernel_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Projector.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Projector.pre_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Projector.linear_1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Projector.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Projector.linear_2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 6, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.paddleocr_vl.SiglipEncoderLayer", "methods": [ { "kind": "function", "name": "SiglipEncoderLayer.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SiglipEncoderLayer.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SiglipEncoderLayer.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipEncoderLayer.layer_norm1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipEncoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipEncoderLayer.layer_norm2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipEncoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 8, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.paddleocr_vl.SiglipVisionTransformer", "methods": [ { "kind": "function", "name": "SiglipVisionTransformer.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SiglipVisionTransformer.forward", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SiglipVisionTransformer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipVisionTransformer.embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipVisionTransformer.encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipVisionTransformer.post_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 11, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 10, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.paddleocr_vl.PaddleOCRVLMultiModalProcessor", "methods": [ { "kind": "function", "name": "PaddleOCRVLMultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "PaddleOCRVLMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PaddleOCRVLMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.paddleocr_vl.SiglipVisionModel", "methods": [ { "kind": "function", "name": "SiglipVisionModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SiglipVisionModel.get_input_embeddings", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SiglipVisionModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "SiglipVisionModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "SiglipVisionModel.dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "SiglipVisionModel.device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "SiglipVisionModel.vision_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipVisionModel.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 12, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 9, "n_attrs": 2, "n_properties": 2 } ], "type_ignores": [], "name": "vllm.model_executor.models.paddleocr_vl", "names": [ "vllm.model_executor.models.paddleocr_vl.PaddleOCRImagePixelInputs", "vllm.model_executor.models.paddleocr_vl.PaddleOCRVLDummyInputsBuilder", "vllm.model_executor.models.paddleocr_vl.PaddleOCRVLForConditionalGeneration", "vllm.model_executor.models.paddleocr_vl.PaddleOCRVLMultiModalProcessor", "vllm.model_executor.models.paddleocr_vl.PaddleOCRVLProcessingInfo", "vllm.model_executor.models.paddleocr_vl.Projector", "vllm.model_executor.models.paddleocr_vl.SigLIPRotaryEmbedding", "vllm.model_executor.models.paddleocr_vl.SiglipAttention", "vllm.model_executor.models.paddleocr_vl.SiglipEncoder", "vllm.model_executor.models.paddleocr_vl.SiglipEncoderLayer", "vllm.model_executor.models.paddleocr_vl.SiglipVisionEmbeddings", "vllm.model_executor.models.paddleocr_vl.SiglipVisionModel", "vllm.model_executor.models.paddleocr_vl.SiglipVisionTransformer", "vllm.model_executor.models.paddleocr_vl.all_gather_interleave", "vllm.model_executor.models.paddleocr_vl.smart_resize" ], "n_typable": 212, "n_typed": 138, "n_any": 0, "n_untyped": 74, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 8, "n_methods": 44, "n_method_overloads": 44, "n_method_params": 103, "n_classes": 13, "n_attrs": 53, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/paligemma.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.paligemma.PaliGemmaForConditionalGeneration", "methods": [ { "kind": "function", "name": "PaliGemmaForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PaliGemmaForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PaliGemmaForConditionalGeneration._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PaliGemmaForConditionalGeneration._image_pixels_to_features", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PaliGemmaForConditionalGeneration._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PaliGemmaForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PaliGemmaForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "PaliGemmaForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PaliGemmaForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PaliGemmaForConditionalGeneration.get_mm_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PaliGemmaForConditionalGeneration.get_num_mm_encoder_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PaliGemmaForConditionalGeneration.get_num_mm_connector_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PaliGemmaForConditionalGeneration.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PaliGemmaForConditionalGeneration.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PaliGemmaForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PaliGemmaForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PaliGemmaForConditionalGeneration.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PaliGemmaForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PaliGemmaForConditionalGeneration.vision_tower", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PaliGemmaForConditionalGeneration.multi_modal_projector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PaliGemmaForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 38, "n_typed": 29, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 18, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.paligemma.PaliGemmaMultiModalProjector", "methods": [ { "kind": "function", "name": "PaliGemmaMultiModalProjector.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PaliGemmaMultiModalProjector.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PaliGemmaMultiModalProjector.linear", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 6, "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.paligemma.PaliGemmaImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "PaliGemmaImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PaliGemmaImagePixelInputs.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.paligemma.PaliGemmaMultiModalProcessor", "methods": [ { "kind": "function", "name": "PaliGemmaMultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "PaliGemmaMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PaliGemmaMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "PaliGemmaMultiModalProcessor.apply", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 15, "n_typed": 15, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 11, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.paligemma.PaliGemmaDummyInputsBuilder", "methods": [ { "kind": "function", "name": "PaliGemmaDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PaliGemmaDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.paligemma.PaliGemmaImageEmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "PaliGemmaImageEmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PaliGemmaImageEmbeddingInputs.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.paligemma.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.paligemma.PaliGemmaProcessingInfo", "methods": [ { "kind": "function", "name": "PaliGemmaProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PaliGemmaProcessingInfo.get_vision_encoder_info", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PaliGemmaProcessingInfo.get_default_tok_params", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PaliGemmaProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PaliGemmaProcessingInfo.get_num_image_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.paligemma.PaliGemmaImageInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.models.paligemma", "names": [ "vllm.model_executor.models.paligemma.PaliGemmaDummyInputsBuilder", "vllm.model_executor.models.paligemma.PaliGemmaForConditionalGeneration", "vllm.model_executor.models.paligemma.PaliGemmaImageEmbeddingInputs", "vllm.model_executor.models.paligemma.PaliGemmaImageInputs", "vllm.model_executor.models.paligemma.PaliGemmaImagePixelInputs", "vllm.model_executor.models.paligemma.PaliGemmaMultiModalProcessor", "vllm.model_executor.models.paligemma.PaliGemmaMultiModalProjector", "vllm.model_executor.models.paligemma.PaliGemmaProcessingInfo", "vllm.model_executor.models.paligemma.logger" ], "n_typable": 78, "n_typed": 64, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 25, "n_method_overloads": 25, "n_method_params": 38, "n_classes": 7, "n_attrs": 16, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/parakeet.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.parakeet.ParakeetProjection", "methods": [ { "kind": "function", "name": "ParakeetProjection.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ParakeetProjection.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ParakeetProjection.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ParakeetProjection.linear1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ParakeetProjection.activation", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ParakeetProjection.linear2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 4, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.parakeet.ParakeetExtractor", "methods": [ { "kind": "function", "name": "ParakeetExtractor.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ParakeetExtractor._normalize_audio_length", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ParakeetExtractor.audio_token_count", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ParakeetExtractor.__call__", "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ParakeetExtractor.audio_length", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ParakeetExtractor.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 9, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 7, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.parakeet.ProjectedParakeet", "methods": [ { "kind": "function", "name": "ProjectedParakeet.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ProjectedParakeet.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ProjectedParakeet.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ProjectedParakeet.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ProjectedParakeet.encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ProjectedParakeet.projection", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 10, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.parakeet", "names": [ "vllm.model_executor.models.parakeet.ParakeetExtractor", "vllm.model_executor.models.parakeet.ParakeetProjection", "vllm.model_executor.models.parakeet.ProjectedParakeet" ], "n_typable": 34, "n_typed": 23, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 16, "n_classes": 3, "n_attrs": 8, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/persimmon.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.persimmon.PersimmonAttention", "methods": [ { "kind": "function", "name": "PersimmonAttention.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "PersimmonAttention._split_heads", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PersimmonAttention._merge_heads", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PersimmonAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PersimmonAttention.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PersimmonAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PersimmonAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PersimmonAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PersimmonAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PersimmonAttention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PersimmonAttention.is_causal", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PersimmonAttention.query_key_value", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PersimmonAttention.dense", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PersimmonAttention.is_qk_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PersimmonAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PersimmonAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PersimmonAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PersimmonAttention.q_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PersimmonAttention.k_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 27, "n_typed": 11, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 15, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.persimmon.PersimmonModel", "methods": [ { "kind": "function", "name": "PersimmonModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PersimmonModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PersimmonModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "PersimmonModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PersimmonModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PersimmonModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PersimmonModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PersimmonModel.final_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PersimmonModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 11, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.persimmon.PersimmonMLP", "methods": [ { "kind": "function", "name": "PersimmonMLP.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "PersimmonMLP.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PersimmonMLP.dense_h_to_4h", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PersimmonMLP.dense_4h_to_h", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PersimmonMLP.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 4, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.persimmon.PersimmonForCausalLM", "methods": [ { "kind": "function", "name": "PersimmonForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PersimmonForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PersimmonForCausalLM.forward", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "PersimmonForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PersimmonForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PersimmonForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PersimmonForCausalLM.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PersimmonForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PersimmonForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PersimmonForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PersimmonForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 12, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.persimmon.PersimmonDecoderLayer", "methods": [ { "kind": "function", "name": "PersimmonDecoderLayer.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "PersimmonDecoderLayer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PersimmonDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PersimmonDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PersimmonDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PersimmonDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PersimmonDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 7, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 5, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.persimmon", "names": [ "vllm.model_executor.models.persimmon.PersimmonAttention", "vllm.model_executor.models.persimmon.PersimmonDecoderLayer", "vllm.model_executor.models.persimmon.PersimmonForCausalLM", "vllm.model_executor.models.persimmon.PersimmonMLP", "vllm.model_executor.models.persimmon.PersimmonModel" ], "n_typable": 86, "n_typed": 45, "n_any": 0, "n_untyped": 41, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 17, "n_method_overloads": 17, "n_method_params": 35, "n_classes": 5, "n_attrs": 34, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/phi.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.phi.PhiLayer", "methods": [ { "kind": "function", "name": "PhiLayer.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "PhiLayer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PhiLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 7, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.phi.PhiMLP", "methods": [ { "kind": "function", "name": "PhiMLP.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "PhiMLP.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PhiMLP.fc1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMLP.fc2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMLP.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 3, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.phi.PhiForCausalLM", "methods": [ { "kind": "function", "name": "PhiForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PhiForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PhiForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "PhiForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PhiForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PhiForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PhiForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 13, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.phi.PhiModel", "methods": [ { "kind": "function", "name": "PhiModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PhiModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PhiModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "PhiModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PhiModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiModel.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiModel.final_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 11, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.phi.PhiAttention", "methods": [ { "kind": "function", "name": "PhiAttention.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "PhiAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PhiAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiAttention.head_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiAttention.dense", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 7, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 7, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.phi", "names": [ "vllm.model_executor.models.phi.PhiAttention", "vllm.model_executor.models.phi.PhiForCausalLM", "vllm.model_executor.models.phi.PhiLayer", "vllm.model_executor.models.phi.PhiMLP", "vllm.model_executor.models.phi.PhiModel" ], "n_typable": 72, "n_typed": 41, "n_any": 0, "n_untyped": 31, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 33, "n_classes": 5, "n_attrs": 25, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/phi3.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.phi3.Phi3ForCausalLM", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Phi3ForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.phi3", "names": [ "vllm.model_executor.models.phi3.Phi3ForCausalLM" ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/phi3v.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.models.phi3v.Phi3VImageInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.phi3v.Phi3HDImageEmbedding", "methods": [ { "kind": "function", "name": "Phi3HDImageEmbedding.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Phi3HDImageEmbedding.get_img_features", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Phi3HDImageEmbedding.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Phi3HDImageEmbedding.hd_feature_transform", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Phi3HDImageEmbedding.reshape_hd_patches_2x2merge", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Phi3HDImageEmbedding.add_image_newline", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Phi3HDImageEmbedding.img_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi3HDImageEmbedding.num_img_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi3HDImageEmbedding.image_dim_out", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi3HDImageEmbedding.use_hd_transform", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi3HDImageEmbedding.with_learnable_separator", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi3HDImageEmbedding.hd_transform_order", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi3HDImageEmbedding.glb_GN", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi3HDImageEmbedding.sub_GN", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi3HDImageEmbedding.img_projection", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi3HDImageEmbedding.type_feature", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 28, "n_typed": 9, "n_any": 0, "n_untyped": 19, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 12, "n_attrs": 10, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.phi3v.Phi3VDummyInputsBuilder", "methods": [ { "kind": "function", "name": "Phi3VDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Phi3VDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.phi3v.CLIP_VIT_LARGE_PATCH14_336_CONFIG", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.phi3v.Phi3VImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Phi3VImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Phi3VImagePixelInputs.pixel_values", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Phi3VImagePixelInputs.image_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.phi3v.Phi3VImageEmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Phi3VImageEmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Phi3VImageEmbeddingInputs.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.phi3v.Phi3VMultiModalProcessor", "methods": [ { "kind": "function", "name": "Phi3VMultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Phi3VMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Phi3VMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Phi3VMultiModalProcessor._recompute_cached_prompt_update", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Phi3VMultiModalProcessor._apply_prompt_updates", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 18, "n_typed": 18, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 13, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.phi3v.Phi3VForCausalLM", "methods": [ { "kind": "function", "name": "Phi3VForCausalLM.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Phi3VForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Phi3VForCausalLM._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Phi3VForCausalLM._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Phi3VForCausalLM.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Phi3VForCausalLM.embed_input_ids", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Phi3VForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Phi3VForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Phi3VForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Phi3VForCausalLM.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi3VForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi3VForCausalLM.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi3VForCausalLM.image_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi3VForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi3VForCausalLM.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi3VForCausalLM.vision_embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi3VForCausalLM.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 35, "n_typed": 25, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 18, "n_attrs": 8, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.phi3v.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.phi3v.Phi3VProcessingInfo", "methods": [ { "kind": "function", "name": "Phi3VProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Phi3VProcessingInfo.get_num_image_tokens", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Phi3VProcessingInfo.get_image_size_with_most_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.phi3v", "names": [ "vllm.model_executor.models.phi3v.CLIP_VIT_LARGE_PATCH14_336_CONFIG", "vllm.model_executor.models.phi3v.Phi3HDImageEmbedding", "vllm.model_executor.models.phi3v.Phi3VDummyInputsBuilder", "vllm.model_executor.models.phi3v.Phi3VForCausalLM", "vllm.model_executor.models.phi3v.Phi3VImageEmbeddingInputs", "vllm.model_executor.models.phi3v.Phi3VImageInputs", "vllm.model_executor.models.phi3v.Phi3VImagePixelInputs", "vllm.model_executor.models.phi3v.Phi3VMultiModalProcessor", "vllm.model_executor.models.phi3v.Phi3VProcessingInfo", "vllm.model_executor.models.phi3v.logger" ], "n_typable": 101, "n_typed": 70, "n_any": 0, "n_untyped": 31, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 25, "n_method_overloads": 25, "n_method_params": 50, "n_classes": 7, "n_attrs": 26, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/phi4mm.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.phi4mm.Phi4MMProcessingInfo", "methods": [ { "kind": "function", "name": "Phi4MMProcessingInfo.get_dynamic_hd", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Phi4MMProcessingInfo.get_feature_extractor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Phi4MMProcessingInfo.get_data_parser", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Phi4MMProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Phi4MMProcessingInfo._find_target_aspect_ratio", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Phi4MMProcessingInfo._compute_num_image_tokens", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Phi4MMProcessingInfo.get_num_image_tokens", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Phi4MMProcessingInfo.get_image_size_with_most_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Phi4MMProcessingInfo.get_audio_num_frames", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Phi4MMProcessingInfo._compute_audio_embed_size", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "Phi4MMProcessingInfo.image_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Phi4MMProcessingInfo.audio_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [], "n_typable": 31, "n_typed": 28, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 19, "n_attrs": 0, "n_properties": 2 }, { "kind": "class", "name": "vllm.model_executor.models.phi4mm.Phi4MMAudioEmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Phi4MMAudioEmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Phi4MMAudioEmbeddingInputs.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.phi4mm.VISION_ENCODER_TO_PROCESSING_CONFIG", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.phi4mm.SIGLIP_NAME", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.phi4mm.Phi4MMAudioFeatureInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Phi4MMAudioFeatureInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Phi4MMAudioFeatureInputs.audio_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.phi4mm.Phi4MMMultiModalProcessor", "methods": [ { "kind": "function", "name": "Phi4MMMultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Phi4MMMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Phi4MMMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Phi4MMMultiModalProcessor._recompute_cached_prompt_update", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 15, "n_typed": 15, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 11, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.phi4mm.Phi4MMImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Phi4MMImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Phi4MMImagePixelInputs.pixel_values", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Phi4MMImagePixelInputs.image_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Phi4MMImagePixelInputs.num_img_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Phi4MMImagePixelInputs.image_attention_mask", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.phi4mm.Phi4MMImageEncoder", "methods": [ { "kind": "function", "name": "Phi4MMImageEncoder.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Phi4MMImageEncoder.get_img_features", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Phi4MMImageEncoder.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Phi4MMImageEncoder.img_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi4MMImageEncoder.num_img_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi4MMImageEncoder.base_feat_height_target", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi4MMImageEncoder.image_dim_out", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi4MMImageEncoder.img_sizes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi4MMImageEncoder.image_attention_mask", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi4MMImageEncoder.use_hd_transform", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi4MMImageEncoder.with_learnable_separator", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi4MMImageEncoder.hd_transform_order", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi4MMImageEncoder.freeze_img_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi4MMImageEncoder.crop_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi4MMImageEncoder.image_token_compression_cls", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi4MMImageEncoder.image_token_compression", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi4MMImageEncoder.base_feat_height_reduction", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi4MMImageEncoder.glb_GN", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi4MMImageEncoder.sub_GN", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi4MMImageEncoder.img_projection", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi4MMImageEncoder.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi4MMImageEncoder.img_features", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi4MMImageEncoder.use_out_place_operations", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi4MMImageEncoder.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi4MMImageEncoder.type_feature", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi4MMImageEncoder.img_processor_padding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 35, "n_typed": 11, "n_any": 0, "n_untyped": 24, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 23, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.phi4mm.Phi4MMDummyInputsBuilder", "methods": [ { "kind": "function", "name": "Phi4MMDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Phi4MMDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.phi4mm.Phi4MMAudioInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.models.phi4mm.get_navit_vision_model", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.models.phi4mm.Phi4MMForCausalLM", "methods": [ { "kind": "function", "name": "Phi4MMForCausalLM.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Phi4MMForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Phi4MMForCausalLM._parse_and_validate_audio_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Phi4MMForCausalLM._process_audio_input", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Phi4MMForCausalLM._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Phi4MMForCausalLM._parse_and_validate_multimodal_inputs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Phi4MMForCausalLM._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Phi4MMForCausalLM.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Phi4MMForCausalLM.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Phi4MMForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Phi4MMForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Phi4MMForCausalLM.get_mm_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Phi4MMForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Phi4MMForCausalLM.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi4MMForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi4MMForCausalLM.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi4MMForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi4MMForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi4MMForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi4MMForCausalLM.vision_encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi4MMForCausalLM.embed_tokens_extend", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Phi4MMForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 39, "n_typed": 29, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 18, "n_attrs": 10, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.phi4mm.cat_with_pad", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [], "name": "vllm.model_executor.models.phi4mm", "names": [ "vllm.model_executor.models.phi4mm.Phi4MMAudioEmbeddingInputs", "vllm.model_executor.models.phi4mm.Phi4MMAudioFeatureInputs", "vllm.model_executor.models.phi4mm.Phi4MMAudioInputs", "vllm.model_executor.models.phi4mm.Phi4MMDummyInputsBuilder", "vllm.model_executor.models.phi4mm.Phi4MMForCausalLM", "vllm.model_executor.models.phi4mm.Phi4MMImageEncoder", "vllm.model_executor.models.phi4mm.Phi4MMImagePixelInputs", "vllm.model_executor.models.phi4mm.Phi4MMMultiModalProcessor", "vllm.model_executor.models.phi4mm.Phi4MMProcessingInfo", "vllm.model_executor.models.phi4mm.SIGLIP_NAME", "vllm.model_executor.models.phi4mm.VISION_ENCODER_TO_PROCESSING_CONFIG", "vllm.model_executor.models.phi4mm.cat_with_pad", "vllm.model_executor.models.phi4mm.get_navit_vision_model" ], "n_typable": 143, "n_typed": 100, "n_any": 0, "n_untyped": 43, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 5, "n_methods": 31, "n_method_overloads": 31, "n_method_params": 61, "n_classes": 8, "n_attrs": 45, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/phi4mm_audio.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.phi4mm_audio.ConformerEncoder", "methods": [ { "kind": "function", "name": "ConformerEncoder.__init__", "n_typed": 39, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 39, "n_params": 38, "n_function_overloads": 1, "n_function_params": 38 }, { "kind": "function", "name": "ConformerEncoder.init_relative_attention_bias", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ConformerEncoder.calculate_hs_mask", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ConformerEncoder.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ConformerEncoder.extra_multi_layer_output_idxs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ConformerEncoder.num_blocks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConformerEncoder.num_lang", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConformerEncoder.kernel_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConformerEncoder.replication_pad_for_subsample_embedding", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ConformerEncoder.num_heads_k", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConformerEncoder.encoders", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConformerEncoder.extra_layer_output_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 56, "n_typed": 50, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 44, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.phi4mm_audio.WindowQformer", "methods": [ { "kind": "function", "name": "WindowQformer.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "WindowQformer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "WindowQformer.decoders", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WindowQformer.queries", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WindowQformer.after_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WindowQformer.window_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 12, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 11, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.phi4mm_audio.TransformerEncoderBase", "methods": [ { "kind": "function", "name": "TransformerEncoderBase.__init__", "n_typed": 18, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 18, "n_params": 17, "n_function_overloads": 1, "n_function_params": 17 }, { "kind": "function", "name": "TransformerEncoderBase.compute_lens_change", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TransformerEncoderBase.forward", "n_typed": 0, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TransformerEncoderBase._chunk_size_selection", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TransformerEncoderBase._get_embed_class", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TransformerEncoderBase._forward_embeddings_core", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TransformerEncoderBase._position_embedding", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TransformerEncoderBase._streaming_mask", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "TransformerEncoderBase.forward_embeddings", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "TransformerEncoderBase.get_offset", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TransformerEncoderBase.input_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TransformerEncoderBase.input_layer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TransformerEncoderBase.chunk_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TransformerEncoderBase.left_chunk", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TransformerEncoderBase.attention_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TransformerEncoderBase.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TransformerEncoderBase.attention_group_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TransformerEncoderBase.time_reduction", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TransformerEncoderBase.nemo_conv_settings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TransformerEncoderBase.encoder_embedding_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TransformerEncoderBase.pos_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TransformerEncoderBase.relative_attention_bias_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TransformerEncoderBase.encoder_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TransformerEncoderBase.embed", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TransformerEncoderBase.relative_attention_bias_layer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 57, "n_typed": 41, "n_any": 1, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 32, "n_attrs": 15, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.phi4mm_audio.ConformerEncoderLayer", "methods": [ { "kind": "function", "name": "ConformerEncoderLayer.__init__", "n_typed": 25, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 25, "n_params": 24, "n_function_overloads": 1, "n_function_params": 24 }, { "kind": "function", "name": "ConformerEncoderLayer.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ConformerEncoderLayer.feed_forward_in", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConformerEncoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConformerEncoderLayer.conv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConformerEncoderLayer.feed_forward_out", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConformerEncoderLayer.layer_norm_att", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConformerEncoderLayer.layer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 37, "n_typed": 31, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 29, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.phi4mm_audio.AudioEmbedding", "methods": [ { "kind": "function", "name": "AudioEmbedding.__init__", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AudioEmbedding.set_audio_embeds", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AudioEmbedding.set_audio_embed_sizes", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AudioEmbedding.get_audio_features", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "AudioEmbedding.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AudioEmbedding.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AudioEmbedding.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AudioEmbedding.audio_dim_out", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AudioEmbedding.audio_dim_in", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AudioEmbedding.freeze_audio_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AudioEmbedding.downsample_rate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AudioEmbedding.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AudioEmbedding.input_embeds", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AudioEmbedding.audio_embed_sizes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AudioEmbedding.encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AudioEmbedding.qformer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AudioEmbedding.conv_ds", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AudioEmbedding.audio_projection", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AudioEmbedding.linear_downsample_rate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AudioEmbedding.audio_projection_for_vision", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 30, "n_typed": 14, "n_any": 1, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 10, "n_attrs": 15, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.phi4mm_audio", "names": [ "vllm.model_executor.models.phi4mm_audio.AudioEmbedding", "vllm.model_executor.models.phi4mm_audio.ConformerEncoder", "vllm.model_executor.models.phi4mm_audio.ConformerEncoderLayer", "vllm.model_executor.models.phi4mm_audio.TransformerEncoderBase", "vllm.model_executor.models.phi4mm_audio.WindowQformer" ], "n_typable": 197, "n_typed": 148, "n_any": 2, "n_untyped": 47, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 23, "n_method_overloads": 23, "n_method_params": 126, "n_classes": 5, "n_attrs": 48, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/phi4mm_utils.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.phi4mm_utils.NemoConvSubsampling", "methods": [ { "kind": "function", "name": "NemoConvSubsampling.__init__", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "NemoConvSubsampling.get_sampling_frames", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NemoConvSubsampling.get_streaming_cache_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NemoConvSubsampling.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NemoConvSubsampling.reset_parameters", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NemoConvSubsampling.conv_split_by_batch", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NemoConvSubsampling.conv_split_by_channel", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NemoConvSubsampling.channel_chunked_conv", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "NemoConvSubsampling.change_subsampling_conv_chunking_factor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "NemoConvSubsampling.subsampling_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemoConvSubsampling.is_causal", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemoConvSubsampling.subsampling_causal_cond", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemoConvSubsampling.subsampling_conv_chunking_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemoConvSubsampling.conv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemoConvSubsampling.out", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemoConvSubsampling.conv2d_subsampling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 32, "n_typed": 25, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 16, "n_attrs": 7, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.phi4mm_utils.calc_length", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "class", "name": "vllm.model_executor.models.phi4mm_utils.DepthWiseSeperableConv1d", "methods": [ { "kind": "function", "name": "DepthWiseSeperableConv1d.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "DepthWiseSeperableConv1d.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DepthWiseSeperableConv1d.dw_conv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DepthWiseSeperableConv1d.depthwise_seperable_out_channel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DepthWiseSeperableConv1d.pw_conv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 8, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 3, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.phi4mm_utils.adaptive_enc_mask", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.model_executor.models.phi4mm_utils.ConvModule", "methods": [ { "kind": "function", "name": "ConvModule.__init__", "n_typed": 17, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 17, "n_params": 16, "n_function_overloads": 1, "n_function_params": 16 }, { "kind": "function", "name": "ConvModule._add_ext_pw_layer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ConvModule.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ConvModule.layer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConvModule.input_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConvModule.ext_pw_out_channel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConvModule.ext_pw_kernel_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConvModule.depthwise_seperable_out_channel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConvModule.glu_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConvModule.bias_in_glu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConvModule.linear_glu_in_convm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConvModule.causal", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConvModule.batch_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConvModule.kernel_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConvModule.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConvModule.dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConvModule.export", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConvModule.dw_sep_conv_1d", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConvModule.bn_layer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ConvModule.ln2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 37, "n_typed": 20, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 17, "n_attrs": 17, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.phi4mm_utils.GLU", "methods": [ { "kind": "function", "name": "GLU.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GLU.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GLU.dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GLU.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 2, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.phi4mm_utils.masked_softmax", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.models.phi4mm_utils.MeanVarianceNormLayer", "methods": [ { "kind": "function", "name": "MeanVarianceNormLayer.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MeanVarianceNormLayer.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MeanVarianceNormLayer.input_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MeanVarianceNormLayer.global_mean", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MeanVarianceNormLayer.global_invstd", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 4, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.phi4mm_utils.T5RelativeAttentionLogitBias", "methods": [ { "kind": "function", "name": "T5RelativeAttentionLogitBias.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "T5RelativeAttentionLogitBias.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "T5RelativeAttentionLogitBias._bucket_relative_position", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "T5RelativeAttentionLogitBias.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "T5RelativeAttentionLogitBias.num_buckets", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "T5RelativeAttentionLogitBias.max_distance", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "T5RelativeAttentionLogitBias.symmetric", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "T5RelativeAttentionLogitBias.bias_values", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 9, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_attrs": 5, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.phi4mm_utils.unfold_tensor", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.models.phi4mm_utils.get_activation", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.model_executor.models.phi4mm_utils.GLUPointWiseConv", "methods": [ { "kind": "function", "name": "GLUPointWiseConv.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "GLUPointWiseConv.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GLUPointWiseConv.glu_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GLUPointWiseConv.output_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GLUPointWiseConv.bias_in_glu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GLUPointWiseConv.glu_act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GLUPointWiseConv.ext_pw_conv_1d", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GLUPointWiseConv.b1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GLUPointWiseConv.b2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 9, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.phi4mm_utils.GLULinear", "methods": [ { "kind": "function", "name": "GLULinear.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GLULinear.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GLULinear.linear", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GLULinear.glu_act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 7, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.phi4mm_utils.MultiHeadedAttention", "methods": [ { "kind": "function", "name": "MultiHeadedAttention.__init__", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "MultiHeadedAttention.forward", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MultiHeadedAttention.inv_sqrt_d_k", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadedAttention.h", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadedAttention.h_k", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadedAttention.g", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadedAttention.d_k", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadedAttention.linear_q", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadedAttention.linear_k", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadedAttention.linear_v", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadedAttention.linear_out", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadedAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadedAttention.dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadedAttention.dropout_rate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadedAttention.use_pt_scaled_dot_product_attention", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadedAttention.quant_q", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadedAttention.quant_x", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadedAttention.dequant", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiHeadedAttention.ffunc", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 35, "n_typed": 22, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 16, "n_attrs": 17, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.phi4mm_utils.MultiSequential", "methods": [ { "kind": "function", "name": "MultiSequential.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.phi4mm_utils.BlockBase", "methods": [ { "kind": "function", "name": "BlockBase.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BlockBase.input_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockBase.output_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 5, "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.phi4mm_utils.AttBlock", "methods": [ { "kind": "function", "name": "AttBlock.memory_dims", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.phi4mm_utils.get_offset", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.models.phi4mm_utils.FeedForward", "methods": [ { "kind": "function", "name": "FeedForward.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "FeedForward.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FeedForward.d_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FeedForward.d_inner", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FeedForward.layer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FeedForward.net", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 8, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.phi4mm_utils.CausalConv2D", "methods": [ { "kind": "function", "name": "CausalConv2D.__init__", "n_typed": 10, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "CausalConv2D.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 14, "n_typed": 12, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 12, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.phi4mm_utils.AbsolutePositionalEncoding", "methods": [ { "kind": "function", "name": "AbsolutePositionalEncoding.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "AbsolutePositionalEncoding.extend_pe", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AbsolutePositionalEncoding.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AbsolutePositionalEncoding.d_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AbsolutePositionalEncoding.xscale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AbsolutePositionalEncoding.dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AbsolutePositionalEncoding.pe", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 8, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 5, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.phi4mm_utils.CausalConv1D", "methods": [ { "kind": "function", "name": "CausalConv1D.__init__", "n_typed": 10, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "CausalConv1D.update_cache", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CausalConv1D.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CausalConv1D.cache_drop_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 16, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 15, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.phi4mm_utils.AttModule", "methods": [ { "kind": "function", "name": "AttModule.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AttModule.set_export", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AttModule.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AttModule.export_mode", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 5, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.phi4mm_utils", "names": [ "vllm.model_executor.models.phi4mm_utils.AbsolutePositionalEncoding", "vllm.model_executor.models.phi4mm_utils.AttBlock", "vllm.model_executor.models.phi4mm_utils.AttModule", "vllm.model_executor.models.phi4mm_utils.BlockBase", "vllm.model_executor.models.phi4mm_utils.CausalConv1D", "vllm.model_executor.models.phi4mm_utils.CausalConv2D", "vllm.model_executor.models.phi4mm_utils.ConvModule", "vllm.model_executor.models.phi4mm_utils.DepthWiseSeperableConv1d", "vllm.model_executor.models.phi4mm_utils.FeedForward", "vllm.model_executor.models.phi4mm_utils.GLU", "vllm.model_executor.models.phi4mm_utils.GLULinear", "vllm.model_executor.models.phi4mm_utils.GLUPointWiseConv", "vllm.model_executor.models.phi4mm_utils.MeanVarianceNormLayer", "vllm.model_executor.models.phi4mm_utils.MultiHeadedAttention", "vllm.model_executor.models.phi4mm_utils.MultiSequential", "vllm.model_executor.models.phi4mm_utils.NemoConvSubsampling", "vllm.model_executor.models.phi4mm_utils.T5RelativeAttentionLogitBias", "vllm.model_executor.models.phi4mm_utils.adaptive_enc_mask", "vllm.model_executor.models.phi4mm_utils.calc_length", "vllm.model_executor.models.phi4mm_utils.get_activation", "vllm.model_executor.models.phi4mm_utils.get_offset", "vllm.model_executor.models.phi4mm_utils.masked_softmax", "vllm.model_executor.models.phi4mm_utils.unfold_tensor" ], "n_typable": 266, "n_typed": 190, "n_any": 0, "n_untyped": 76, "n_functions": 6, "n_function_overloads": 6, "n_function_params": 17, "n_methods": 43, "n_method_overloads": 43, "n_method_params": 125, "n_classes": 17, "n_attrs": 75, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/phimoe.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.phimoe.PhiMoEModel", "methods": [ { "kind": "function", "name": "PhiMoEModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PhiMoEModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PhiMoEModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "PhiMoEModel.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PhiMoEModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PhiMoEModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEModel.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 12, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 8, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.phimoe.PhiMoEDecoderLayer", "methods": [ { "kind": "function", "name": "PhiMoEDecoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "PhiMoEDecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PhiMoEDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEDecoderLayer.block_sparse_moe", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 9, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.phimoe.mp", "methods": [ { "kind": "function", "name": "mp.forward", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "mp.backward", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 10, "n_typed": 6, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.phimoe.PhiMoE", "methods": [ { "kind": "function", "name": "PhiMoE.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "PhiMoE.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PhiMoE.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoE.gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoE.experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 10, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 9, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.phimoe.PhiMoEAttention", "methods": [ { "kind": "function", "name": "PhiMoEAttention.__init__", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "PhiMoEAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PhiMoEAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 26, "n_typed": 13, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 11, "n_attrs": 13, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.phimoe.sparsemixer", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.models.phimoe.PhiMoEForCausalLM", "methods": [ { "kind": "function", "name": "PhiMoEForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PhiMoEForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PhiMoEForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "PhiMoEForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PhiMoEForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PhiMoEForCausalLM.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PhiMoEForCausalLM.fall_back_to_pt_during_load", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PhiMoEForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PhiMoEForCausalLM.embedding_modules", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PhiMoEForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 14, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 9, "n_attrs": 9, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.phimoe.phimoe_routing_function", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.model_executor.models.phimoe.PhiMoEConfig", "methods": [ { "kind": "function", "name": "PhiMoEConfig.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 28, "n_overloads": 1, "n_typable": 28, "n_params": 27, "n_function_overloads": 1, "n_function_params": 27 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PhiMoEConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PhiMoEConfig.keys_to_ignore_at_inference", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PhiMoEConfig.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEConfig.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEConfig.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEConfig.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEConfig.num_hidden_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEConfig.num_attention_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEConfig.sliding_window", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEConfig.attention_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEConfig.lm_head_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEConfig.num_key_value_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEConfig.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEConfig.hidden_act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEConfig.initializer_range", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEConfig.rms_norm_eps", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEConfig.use_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEConfig.attention_dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEConfig.num_experts_per_tok", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEConfig.num_local_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEConfig.output_router_logits", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEConfig.router_aux_loss_coef", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PhiMoEConfig.router_jitter_noise", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 49, "n_typed": 0, "n_any": 0, "n_untyped": 49, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 27, "n_attrs": 23, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.phimoe", "names": [ "vllm.model_executor.models.phimoe.PhiMoE", "vllm.model_executor.models.phimoe.PhiMoEAttention", "vllm.model_executor.models.phimoe.PhiMoEConfig", "vllm.model_executor.models.phimoe.PhiMoEDecoderLayer", "vllm.model_executor.models.phimoe.PhiMoEForCausalLM", "vllm.model_executor.models.phimoe.PhiMoEModel", "vllm.model_executor.models.phimoe.mp", "vllm.model_executor.models.phimoe.phimoe_routing_function", "vllm.model_executor.models.phimoe.sparsemixer" ], "n_typable": 161, "n_typed": 68, "n_any": 0, "n_untyped": 93, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 6, "n_methods": 20, "n_method_overloads": 20, "n_method_params": 79, "n_classes": 7, "n_attrs": 59, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/pixtral.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.models.pixtral.position_meshgrid", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.models.pixtral.get_sub_grids", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.model_executor.models.pixtral.Transformer", "methods": [ { "kind": "function", "name": "Transformer.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Transformer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Transformer.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.pixtral.PATCH_MERGE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.pixtral.PixtralHFMLP", "methods": [ { "kind": "function", "name": "PixtralHFMLP.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "PixtralHFMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PixtralHFMLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PixtralHFMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PixtralHFMLP.act_and_mul", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 6, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.pixtral.TransformerBlock", "methods": [ { "kind": "function", "name": "TransformerBlock.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TransformerBlock.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TransformerBlock.attention", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TransformerBlock.feed_forward", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TransformerBlock.attention_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TransformerBlock.ffn_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 5, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.pixtral.VisionTransformer", "methods": [ { "kind": "function", "name": "VisionTransformer.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "VisionTransformer.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "VisionTransformer.max_patches_per_side", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "VisionTransformer.device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "VisionTransformer.dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "VisionTransformer.freqs_cis", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "VisionTransformer.args", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VisionTransformer.patch_conv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VisionTransformer.ln_pre", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VisionTransformer.transformer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 4, "n_properties": 4 }, { "kind": "class", "name": "vllm.model_executor.models.pixtral.PixtralProcessingInfo", "methods": [ { "kind": "function", "name": "PixtralProcessingInfo.get_tokenizer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PixtralProcessingInfo.get_hf_processor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PixtralProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PixtralProcessingInfo.get_num_image_tokens", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "PixtralProcessingInfo.get_image_size_with_most_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 8, "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.pixtral.VisionLanguageAdapter", "methods": [ { "kind": "function", "name": "VisionLanguageAdapter.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VisionLanguageAdapter.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "VisionLanguageAdapter.w_in", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VisionLanguageAdapter.gelu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VisionLanguageAdapter.w_out", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 4, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.pixtral.PixtralMultiModalProcessor", "methods": [ { "kind": "function", "name": "PixtralMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PixtralMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "PixtralMultiModalProcessor._cached_apply_hf_processor", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 10, "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.pixtral.PixtralForConditionalGeneration", "methods": [ { "kind": "function", "name": "PixtralForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PixtralForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PixtralForConditionalGeneration._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PixtralForConditionalGeneration._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PixtralForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PixtralForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "PixtralForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PixtralForConditionalGeneration.load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PixtralForConditionalGeneration.get_mm_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PixtralForConditionalGeneration.get_num_mm_encoder_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PixtralForConditionalGeneration.get_num_mm_connector_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PixtralForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PixtralForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PixtralForConditionalGeneration.vision_args", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PixtralForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PixtralForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PixtralForConditionalGeneration.vision_encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PixtralForConditionalGeneration.pre_mm_projector_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PixtralForConditionalGeneration.patch_merger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PixtralForConditionalGeneration.vision_language_adapter", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 36, "n_typed": 25, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 16, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.pixtral.PixtralImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "PixtralImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PixtralImagePixelInputs.images", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.pixtral.PixtralProcessorAdapter", "methods": [ { "kind": "function", "name": "PixtralProcessorAdapter.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PixtralProcessorAdapter.__call__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [ { "kind": "property", "name": "PixtralProcessorAdapter.image_processor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "PixtralProcessorAdapter.image_break_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "PixtralProcessorAdapter.image_token_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "PixtralProcessorAdapter.image_end_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "PixtralProcessorAdapter.image_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "PixtralProcessorAdapter.patch_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "PixtralProcessorAdapter.tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 12, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 1, "n_properties": 6 }, { "kind": "class", "name": "vllm.model_executor.models.pixtral.PixtralDummyInputsBuilder", "methods": [ { "kind": "function", "name": "PixtralDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PixtralDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "PixtralDummyInputsBuilder.get_dummy_processor_inputs", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 10, "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.pixtral.Attention", "methods": [ { "kind": "function", "name": "Attention.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Attention.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Attention.args", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Attention.n_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Attention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Attention.wq", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Attention.wk", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Attention.wv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Attention.wo", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 5, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 7, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.pixtral.USE_XFORMERS_OPS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.pixtral.VisionEncoderArgs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "VisionEncoderArgs.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VisionEncoderArgs.num_channels", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VisionEncoderArgs.image_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VisionEncoderArgs.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VisionEncoderArgs.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VisionEncoderArgs.num_hidden_layers", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VisionEncoderArgs.num_attention_heads", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VisionEncoderArgs.rope_theta", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VisionEncoderArgs.image_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VisionEncoderArgs.adapter_bias", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VisionEncoderArgs.spatial_merge_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VisionEncoderArgs.add_pre_mm_projector_layer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VisionEncoderArgs.mm_projector_id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 13, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.pixtral.PixtralHFVisionModel", "methods": [ { "kind": "function", "name": "PixtralHFVisionModel.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "PixtralHFVisionModel.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "PixtralHFVisionModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PixtralHFVisionModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PixtralHFVisionModel.patch_conv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PixtralHFVisionModel.ln_pre", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PixtralHFVisionModel.transformer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PixtralHFVisionModel.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PixtralHFVisionModel.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PixtralHFVisionModel.patch_positional_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 12, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.pixtral.PatchMerger", "methods": [ { "kind": "function", "name": "PatchMerger.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "PatchMerger.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PatchMerger.permute", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PatchMerger.spatial_merge_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PatchMerger.mlp_input_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PatchMerger.merging_layer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 10, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.pixtral.PixtralHFEncoderInfo", "methods": [ { "kind": "function", "name": "PixtralHFEncoderInfo.get_num_image_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PixtralHFEncoderInfo.get_image_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PixtralHFEncoderInfo.get_patch_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PixtralHFEncoderInfo.get_patch_grid_length", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PixtralHFEncoderInfo.get_patch_grid_size", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.pixtral.FeedForward", "methods": [ { "kind": "function", "name": "FeedForward.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FeedForward.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FeedForward.w1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FeedForward.w2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FeedForward.w3", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 3, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 3, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.pixtral.precompute_freqs_cis_2d", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.model_executor.models.pixtral.PixtralHFTransformer", "methods": [ { "kind": "function", "name": "PixtralHFTransformer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "PixtralHFTransformer.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PixtralHFTransformer.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 10, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.pixtral.PixtralHFAttention", "methods": [ { "kind": "function", "name": "PixtralHFAttention.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "PixtralHFAttention.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PixtralHFAttention.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PixtralHFAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PixtralHFAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PixtralHFAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PixtralHFAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PixtralHFAttention.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PixtralHFAttention.n_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 8, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.pixtral.PixtralHFTransformerBlock", "methods": [ { "kind": "function", "name": "PixtralHFTransformerBlock.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "PixtralHFTransformerBlock.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PixtralHFTransformerBlock.attention_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PixtralHFTransformerBlock.attention", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PixtralHFTransformerBlock.feed_forward", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PixtralHFTransformerBlock.ffn_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 8, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 4, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.pixtral.apply_rotary_emb_vit", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [], "name": "vllm.model_executor.models.pixtral", "names": [ "vllm.model_executor.models.pixtral.Attention", "vllm.model_executor.models.pixtral.FeedForward", "vllm.model_executor.models.pixtral.PATCH_MERGE", "vllm.model_executor.models.pixtral.PatchMerger", "vllm.model_executor.models.pixtral.PixtralDummyInputsBuilder", "vllm.model_executor.models.pixtral.PixtralForConditionalGeneration", "vllm.model_executor.models.pixtral.PixtralHFAttention", "vllm.model_executor.models.pixtral.PixtralHFEncoderInfo", "vllm.model_executor.models.pixtral.PixtralHFMLP", "vllm.model_executor.models.pixtral.PixtralHFTransformer", "vllm.model_executor.models.pixtral.PixtralHFTransformerBlock", "vllm.model_executor.models.pixtral.PixtralHFVisionModel", "vllm.model_executor.models.pixtral.PixtralImagePixelInputs", "vllm.model_executor.models.pixtral.PixtralMultiModalProcessor", "vllm.model_executor.models.pixtral.PixtralProcessingInfo", "vllm.model_executor.models.pixtral.PixtralProcessorAdapter", "vllm.model_executor.models.pixtral.Transformer", "vllm.model_executor.models.pixtral.TransformerBlock", "vllm.model_executor.models.pixtral.USE_XFORMERS_OPS", "vllm.model_executor.models.pixtral.VisionEncoderArgs", "vllm.model_executor.models.pixtral.VisionLanguageAdapter", "vllm.model_executor.models.pixtral.VisionTransformer", "vllm.model_executor.models.pixtral.apply_rotary_emb_vit", "vllm.model_executor.models.pixtral.get_sub_grids", "vllm.model_executor.models.pixtral.position_meshgrid", "vllm.model_executor.models.pixtral.precompute_freqs_cis_2d" ], "n_typable": 240, "n_typed": 174, "n_any": 0, "n_untyped": 66, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 11, "n_methods": 55, "n_method_overloads": 55, "n_method_params": 101, "n_classes": 20, "n_attrs": 74, "n_properties": 10, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/plamo2.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.plamo2.Plamo2DecoderLayer", "methods": [ { "kind": "function", "name": "Plamo2DecoderLayer.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Plamo2DecoderLayer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Plamo2DecoderLayer.is_mamba", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2DecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2DecoderLayer.pre_mixer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2DecoderLayer.post_mixer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2DecoderLayer.pre_mlp_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2DecoderLayer.post_mlp_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2DecoderLayer.mixer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 7, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 7, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.plamo2.plamo2_mamba_mixer_fake", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.model_executor.models.plamo2.DenseMLP", "methods": [ { "kind": "function", "name": "DenseMLP.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DenseMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DenseMLP.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DenseMLP.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DenseMLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DenseMLP.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DenseMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 6, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.plamo2.Plamo2Decoder", "methods": [ { "kind": "function", "name": "Plamo2Decoder.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Plamo2Decoder.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.plamo2.Plamo2Model", "methods": [ { "kind": "function", "name": "Plamo2Model.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Plamo2Model.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Plamo2Model.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Plamo2Model.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2Model.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2Model.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2Model.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2Model.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2Model.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 9, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 6, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.plamo2.plamo2_mamba_mixer", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.model_executor.models.plamo2.Plamo2MambaMixer", "methods": [ { "kind": "function", "name": "Plamo2MambaMixer.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Plamo2MambaMixer._project_ssm_parameters", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Plamo2MambaMixer.forward", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Plamo2MambaMixer.forward_impl", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Plamo2MambaMixer.get_state_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Plamo2MambaMixer.get_state_shape", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "Plamo2MambaMixer.mamba_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "Plamo2MambaMixer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2MambaMixer.cache_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2MambaMixer.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2MambaMixer.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2MambaMixer.is_lora_enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2MambaMixer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2MambaMixer.ssm_state_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2MambaMixer.conv_kernel_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2MambaMixer.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2MambaMixer.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2MambaMixer.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2MambaMixer.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2MambaMixer.time_step_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2MambaMixer.conv1d", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2MambaMixer.in_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2MambaMixer.bcdt_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2MambaMixer.dt_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2MambaMixer.A", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2MambaMixer.D", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2MambaMixer.dt_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2MambaMixer.out_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2MambaMixer.activation", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2MambaMixer.dt_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2MambaMixer.B_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2MambaMixer.C_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2MambaMixer.chunk_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2MambaMixer.kv_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2MambaMixer.prefix", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 45, "n_typed": 10, "n_any": 0, "n_untyped": 35, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 10, "n_attrs": 28, "n_properties": 1 }, { "kind": "function", "name": "vllm.model_executor.models.plamo2.is_mamba", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.models.plamo2.Plamo2AttentionMixer", "methods": [ { "kind": "function", "name": "Plamo2AttentionMixer.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Plamo2AttentionMixer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Plamo2AttentionMixer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2AttentionMixer.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2AttentionMixer.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2AttentionMixer.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2AttentionMixer.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2AttentionMixer.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2AttentionMixer.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2AttentionMixer.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2AttentionMixer.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2AttentionMixer.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2AttentionMixer.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2AttentionMixer.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2AttentionMixer.q_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2AttentionMixer.k_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2AttentionMixer.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 23, "n_typed": 6, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 15, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.plamo2.Plamo2Config", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Plamo2Config.model_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2Config.hidden_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2Config.num_hidden_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2Config.rms_norm_eps", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2Config.num_attention_heads", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2Config.hidden_size_per_head", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2Config.num_key_value_heads", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2Config.mamba_d_state", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2Config.mamba_d_conv", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2Config.mamba_num_heads", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2Config.mamba_step", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2Config.intermediate_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2Config.vocab_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 13, "n_typed": 13, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 13, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.plamo2.Plamo2ForCausalLM", "methods": [ { "kind": "function", "name": "Plamo2ForCausalLM.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Plamo2ForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Plamo2ForCausalLM.forward", "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Plamo2ForCausalLM.get_mamba_state_dtype_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Plamo2ForCausalLM.get_mamba_state_shape_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Plamo2ForCausalLM.get_mamba_state_copy_func", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Plamo2ForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Plamo2ForCausalLM.load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Plamo2ForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Plamo2ForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2ForCausalLM.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2ForCausalLM.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2ForCausalLM.scheduler_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2ForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2ForCausalLM.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2ForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2ForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo2ForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 29, "n_typed": 17, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 12, "n_attrs": 10, "n_properties": 0 } ], "type_ignores": [ { "kind": "type", "rules": null } ], "name": "vllm.model_executor.models.plamo2", "names": [ "vllm.model_executor.models.plamo2.DenseMLP", "vllm.model_executor.models.plamo2.Plamo2AttentionMixer", "vllm.model_executor.models.plamo2.Plamo2Config", "vllm.model_executor.models.plamo2.Plamo2Decoder", "vllm.model_executor.models.plamo2.Plamo2DecoderLayer", "vllm.model_executor.models.plamo2.Plamo2ForCausalLM", "vllm.model_executor.models.plamo2.Plamo2MambaMixer", "vllm.model_executor.models.plamo2.Plamo2Model", "vllm.model_executor.models.plamo2.is_mamba", "vllm.model_executor.models.plamo2.plamo2_mamba_mixer", "vllm.model_executor.models.plamo2.plamo2_mamba_mixer_fake" ], "n_typable": 172, "n_typed": 86, "n_any": 0, "n_untyped": 86, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 8, "n_methods": 25, "n_method_overloads": 25, "n_method_params": 52, "n_classes": 8, "n_attrs": 84, "n_properties": 1, "n_type_ignores": 1 }, { "path": "vllm/model_executor/models/plamo3.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.plamo3.Plamo3Decoder", "methods": [ { "kind": "function", "name": "Plamo3Decoder.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Plamo3Decoder.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.plamo3.DenseMLP", "methods": [ { "kind": "function", "name": "DenseMLP.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DenseMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DenseMLP.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DenseMLP.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DenseMLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DenseMLP.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DenseMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 6, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.plamo3.Plamo3DecoderLayer", "methods": [ { "kind": "function", "name": "Plamo3DecoderLayer.__init__", "n_typed": 3, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Plamo3DecoderLayer.forward", "n_typed": 4, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Plamo3DecoderLayer.mixer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3DecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3DecoderLayer.pre_mixer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3DecoderLayer.post_mixer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3DecoderLayer.pre_mlp_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3DecoderLayer.post_mlp_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 7, "n_any": 2, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.plamo3.Plamo3Model", "methods": [ { "kind": "function", "name": "Plamo3Model.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Plamo3Model.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Plamo3Model.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Plamo3Model.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3Model.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3Model.org_vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3Model.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3Model.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3Model.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3Model.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 9, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 7, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.plamo3.rms_norm_weight_loader", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.model_executor.models.plamo3.Plamo3ForCausalLM", "methods": [ { "kind": "function", "name": "Plamo3ForCausalLM.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Plamo3ForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Plamo3ForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Plamo3ForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Plamo3ForCausalLM.load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Plamo3ForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Plamo3ForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3ForCausalLM.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3ForCausalLM.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3ForCausalLM.scheduler_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3ForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3ForCausalLM.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3ForCausalLM.unpadded_vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3ForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3ForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3ForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 24, "n_typed": 13, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 11, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.plamo3.Plamo3Config", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Plamo3Config.model_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3Config.hidden_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3Config.num_hidden_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3Config.rms_norm_eps", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3Config.num_attention_heads", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3Config.head_dim", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3Config.num_key_value_heads", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3Config.interleaved_sliding_window", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3Config.sliding_window_pattern", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3Config.rope_parameters", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3Config.rope_local_theta", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3Config.intermediate_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3Config.vocab_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 13, "n_typed": 13, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 13, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.plamo3.Plamo3AttentionMixer", "methods": [ { "kind": "function", "name": "Plamo3AttentionMixer.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Plamo3AttentionMixer.forward", "n_typed": 4, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Plamo3AttentionMixer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3AttentionMixer.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3AttentionMixer.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3AttentionMixer.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3AttentionMixer.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3AttentionMixer.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3AttentionMixer.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3AttentionMixer.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3AttentionMixer.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3AttentionMixer.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3AttentionMixer.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3AttentionMixer.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3AttentionMixer.q_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3AttentionMixer.k_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Plamo3AttentionMixer.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 24, "n_typed": 7, "n_any": 1, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 15, "n_properties": 0 } ], "type_ignores": [ { "kind": "type", "rules": null } ], "name": "vllm.model_executor.models.plamo3", "names": [ "vllm.model_executor.models.plamo3.DenseMLP", "vllm.model_executor.models.plamo3.Plamo3AttentionMixer", "vllm.model_executor.models.plamo3.Plamo3Config", "vllm.model_executor.models.plamo3.Plamo3Decoder", "vllm.model_executor.models.plamo3.Plamo3DecoderLayer", "vllm.model_executor.models.plamo3.Plamo3ForCausalLM", "vllm.model_executor.models.plamo3.Plamo3Model", "vllm.model_executor.models.plamo3.rms_norm_weight_loader" ], "n_typable": 113, "n_typed": 64, "n_any": 3, "n_untyped": 46, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 16, "n_method_overloads": 16, "n_method_params": 39, "n_classes": 7, "n_attrs": 57, "n_properties": 0, "n_type_ignores": 1 }, { "path": "vllm/model_executor/models/qwen.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.qwen.QWenLMHeadModel", "methods": [ { "kind": "function", "name": "QWenLMHeadModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "QWenLMHeadModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "QWenLMHeadModel.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 8, "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen.QWenBlock", "methods": [ { "kind": "function", "name": "QWenBlock.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "QWenBlock.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "QWenBlock.ln_1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QWenBlock.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QWenBlock.ln_2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QWenBlock.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 8, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen.QWenModel", "methods": [ { "kind": "function", "name": "QWenModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "QWenModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "QWenModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "QWenModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QWenModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QWenModel.wte", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QWenModel.ln_f", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QWenModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 9, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen.QWenBaseModel", "methods": [ { "kind": "function", "name": "QWenBaseModel.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "QWenBaseModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "QWenBaseModel.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "QWenBaseModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "QWenBaseModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QWenBaseModel.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QWenBaseModel.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QWenBaseModel.transformer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QWenBaseModel.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QWenBaseModel.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QWenBaseModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 10, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 6, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen.QWenAttention", "methods": [ { "kind": "function", "name": "QWenAttention.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "QWenAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "QWenAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QWenAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QWenAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QWenAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QWenAttention.c_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QWenAttention.c_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QWenAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QWenAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QWenAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 10, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 9, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen.QWenMLP", "methods": [ { "kind": "function", "name": "QWenMLP.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "QWenMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "QWenMLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QWenMLP.c_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QWenMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 7, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.qwen", "names": [ "vllm.model_executor.models.qwen.QWenAttention", "vllm.model_executor.models.qwen.QWenBaseModel", "vllm.model_executor.models.qwen.QWenBlock", "vllm.model_executor.models.qwen.QWenLMHeadModel", "vllm.model_executor.models.qwen.QWenMLP", "vllm.model_executor.models.qwen.QWenModel" ], "n_typable": 84, "n_typed": 51, "n_any": 0, "n_untyped": 33, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 41, "n_classes": 6, "n_attrs": 29, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/qwen2.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.qwen2.Qwen2MLP", "methods": [ { "kind": "function", "name": "Qwen2MLP.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Qwen2MLP.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen2MLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2MLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2MLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 6, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2.Qwen2ForCausalLM", "methods": [ { "kind": "function", "name": "Qwen2ForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen2ForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2ForCausalLM.set_aux_hidden_state_layers", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2ForCausalLM.get_eagle3_aux_hidden_state_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Qwen2ForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Qwen2ForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2ForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen2ForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen2ForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2ForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2ForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2ForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2ForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2ForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 23, "n_typed": 16, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 10, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2.Qwen2DecoderLayer", "methods": [ { "kind": "function", "name": "Qwen2DecoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Qwen2DecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen2DecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2DecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2DecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2DecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2DecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 9, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 5, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.qwen2.qwen_2_model_invariants", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2.Qwen2Model", "methods": [ { "kind": "function", "name": "Qwen2Model.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Qwen2Model.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2Model.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Qwen2Model.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen2Model.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2Model.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2Model.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2Model.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2Model.aux_hidden_state_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2Model.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2Model.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 12, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 9, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2.Qwen2Attention", "methods": [ { "kind": "function", "name": "Qwen2Attention.__init__", "n_typed": 13, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 }, { "kind": "function", "name": "Qwen2Attention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen2Attention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2Attention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2Attention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2Attention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2Attention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2Attention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2Attention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2Attention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2Attention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2Attention.dual_chunk_attention_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2Attention.qk_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2Attention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2Attention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2Attention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2Attention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2Attention.q_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2Attention.k_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 33, "n_typed": 16, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 14, "n_attrs": 17, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.qwen2", "names": [ "vllm.model_executor.models.qwen2.Qwen2Attention", "vllm.model_executor.models.qwen2.Qwen2DecoderLayer", "vllm.model_executor.models.qwen2.Qwen2ForCausalLM", "vllm.model_executor.models.qwen2.Qwen2MLP", "vllm.model_executor.models.qwen2.Qwen2Model", "vllm.model_executor.models.qwen2.qwen_2_model_invariants" ], "n_typable": 106, "n_typed": 63, "n_any": 0, "n_untyped": 43, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 4, "n_methods": 17, "n_method_overloads": 17, "n_method_params": 46, "n_classes": 5, "n_attrs": 39, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/qwen2_5_omni_thinker.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.models.qwen2_5_omni_thinker.flash_attn", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_5_omni_thinker.Qwen2_5OmniAudioFeatureInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen2_5OmniAudioFeatureInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5OmniAudioFeatureInputs.input_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5OmniAudioFeatureInputs.audio_feature_lengths", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5OmniAudioFeatureInputs.feature_attention_mask", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_5_omni_thinker.Qwen2_5OmniThinkerProcessingInfo", "methods": [ { "kind": "function", "name": "Qwen2_5OmniThinkerProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Qwen2_5OmniThinkerProcessingInfo.get_hf_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2_5OmniThinkerProcessingInfo.get_feature_extractor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2_5OmniThinkerProcessingInfo.get_data_parser", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Qwen2_5OmniThinkerProcessingInfo.get_target_channels", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Qwen2_5OmniThinkerProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Qwen2_5OmniThinkerProcessingInfo.get_mm_max_tokens_per_item", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 11, "n_typed": 8, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_5_omni_thinker.Qwen2_5OmniThinkerMultiModalProcessor", "methods": [ { "kind": "function", "name": "Qwen2_5OmniThinkerMultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Qwen2_5OmniThinkerMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen2_5OmniThinkerMultiModalProcessor._derive_audio_from_video_placeholders", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen2_5OmniThinkerMultiModalProcessor._maybe_apply_prompt_updates", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Qwen2_5OmniThinkerMultiModalProcessor.omni_get_updates_use_audio_in_video", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Qwen2_5OmniThinkerMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Qwen2_5OmniThinkerMultiModalProcessor._apply_hf_processor_main", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Qwen2_5OmniThinkerMultiModalProcessor._apply_hf_processor_mm_only", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 36, "n_typed": 36, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 28, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_5_omni_thinker.Qwen2_5OmniConditionalGenerationMixin", "methods": [ { "kind": "function", "name": "Qwen2_5OmniConditionalGenerationMixin._parse_and_validate_audio_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2_5OmniConditionalGenerationMixin._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2_5OmniConditionalGenerationMixin._parse_and_validate_video_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2_5OmniConditionalGenerationMixin._process_audio_input", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Qwen2_5OmniConditionalGenerationMixin._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2_5OmniConditionalGenerationMixin._process_video_input", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 16, "n_typed": 16, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 10, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.qwen2_5_omni_thinker.merge_interleaved_embeddings", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_5_omni_thinker.Qwen2_5OmniThinkerMultiModalDataParser", "methods": [ { "kind": "function", "name": "Qwen2_5OmniThinkerMultiModalDataParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Qwen2_5OmniThinkerMultiModalDataParser._parse_audio_data", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 3, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.qwen2_5_omni_thinker.check_interleaved_audio_video", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.models.qwen2_5_omni_thinker.create_qwen2_5_omni_thinker_field_factory", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_5_omni_thinker.Qwen2_5OmniThinkerForConditionalGeneration", "methods": [ { "kind": "function", "name": "Qwen2_5OmniThinkerForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen2_5OmniThinkerForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen2_5OmniThinkerForConditionalGeneration._parse_and_validate_multimodal_inputs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2_5OmniThinkerForConditionalGeneration._get_audio_for_video_mapping", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2_5OmniThinkerForConditionalGeneration._compute_audio_token_count", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2_5OmniThinkerForConditionalGeneration.iter_mm_features", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2_5OmniThinkerForConditionalGeneration._compute_interleaved_positions", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen2_5OmniThinkerForConditionalGeneration.get_mrope_input_positions", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen2_5OmniThinkerForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2_5OmniThinkerForConditionalGeneration.embed_input_ids", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Qwen2_5OmniThinkerForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Qwen2_5OmniThinkerForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2_5OmniThinkerForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2_5OmniThinkerForConditionalGeneration.get_mm_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen2_5OmniThinkerForConditionalGeneration.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5OmniThinkerForConditionalGeneration.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen2_5OmniThinkerForConditionalGeneration.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5OmniThinkerForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5OmniThinkerForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5OmniThinkerForConditionalGeneration.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5OmniThinkerForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5OmniThinkerForConditionalGeneration.audio_tower", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5OmniThinkerForConditionalGeneration.visual", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5OmniThinkerForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 47, "n_typed": 37, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 24, "n_attrs": 10, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.qwen2_5_omni_thinker.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_5_omni_thinker.Qwen2_5OmniThinkerDummyInputsBuilder", "methods": [ { "kind": "function", "name": "Qwen2_5OmniThinkerDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2_5OmniThinkerDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.qwen2_5_omni_thinker", "names": [ "vllm.model_executor.models.qwen2_5_omni_thinker.Qwen2_5OmniAudioFeatureInputs", "vllm.model_executor.models.qwen2_5_omni_thinker.Qwen2_5OmniConditionalGenerationMixin", "vllm.model_executor.models.qwen2_5_omni_thinker.Qwen2_5OmniThinkerDummyInputsBuilder", "vllm.model_executor.models.qwen2_5_omni_thinker.Qwen2_5OmniThinkerForConditionalGeneration", "vllm.model_executor.models.qwen2_5_omni_thinker.Qwen2_5OmniThinkerMultiModalDataParser", "vllm.model_executor.models.qwen2_5_omni_thinker.Qwen2_5OmniThinkerMultiModalProcessor", "vllm.model_executor.models.qwen2_5_omni_thinker.Qwen2_5OmniThinkerProcessingInfo", "vllm.model_executor.models.qwen2_5_omni_thinker.check_interleaved_audio_video", "vllm.model_executor.models.qwen2_5_omni_thinker.create_qwen2_5_omni_thinker_field_factory", "vllm.model_executor.models.qwen2_5_omni_thinker.flash_attn", "vllm.model_executor.models.qwen2_5_omni_thinker.logger", "vllm.model_executor.models.qwen2_5_omni_thinker.merge_interleaved_embeddings" ], "n_typable": 142, "n_typed": 125, "n_any": 0, "n_untyped": 17, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 12, "n_methods": 39, "n_method_overloads": 39, "n_method_params": 74, "n_classes": 7, "n_attrs": 16, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/qwen2_5_vl.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.models.qwen2_5_vl.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_5_vl.Qwen2_5_VLImageEmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen2_5_VLImageEmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VLImageEmbeddingInputs.image_embeds", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VLImageEmbeddingInputs.image_grid_thw", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_5_vl.Qwen2_5_VisionAttention", "methods": [ { "kind": "function", "name": "Qwen2_5_VisionAttention.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Qwen2_5_VisionAttention.forward", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen2_5_VisionAttention.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VisionAttention.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VisionAttention.hidden_size_per_attention_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VisionAttention.num_attention_heads_per_partition", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VisionAttention.qkv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VisionAttention.proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VisionAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VisionAttention.apply_rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 13, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 11, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_5_vl.Qwen2_5_VLImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen2_5_VLImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VLImagePixelInputs.pixel_values", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VLImagePixelInputs.image_grid_thw", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_5_vl.Qwen2_5_VLVideoPixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen2_5_VLVideoPixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VLVideoPixelInputs.pixel_values_videos", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VLVideoPixelInputs.video_grid_thw", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VLVideoPixelInputs.second_per_grid_ts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VLVideoPixelInputs.timestamps", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_5_vl.Qwen2_5_VLForConditionalGeneration", "methods": [ { "kind": "function", "name": "Qwen2_5_VLForConditionalGeneration.iter_mm_grid_thw", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2_5_VLForConditionalGeneration.get_mrope_input_positions", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen2_5_VLForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen2_5_VLForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen2_5_VLForConditionalGeneration.set_aux_hidden_state_layers", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2_5_VLForConditionalGeneration.get_eagle3_aux_hidden_state_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Qwen2_5_VLForConditionalGeneration._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2_5_VLForConditionalGeneration._parse_and_validate_video_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2_5_VLForConditionalGeneration._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2_5_VLForConditionalGeneration._postprocess_image_embeds_evs", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen2_5_VLForConditionalGeneration._process_video_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2_5_VLForConditionalGeneration._postprocess_video_embeds_evs", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen2_5_VLForConditionalGeneration.recompute_mrope_positions", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Qwen2_5_VLForConditionalGeneration._parse_and_validate_multimodal_inputs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2_5_VLForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2_5_VLForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Qwen2_5_VLForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2_5_VLForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2_5_VLForConditionalGeneration.get_mm_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Qwen2_5_VLForConditionalGeneration.get_num_mm_encoder_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2_5_VLForConditionalGeneration.get_num_mm_connector_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen2_5_VLForConditionalGeneration.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen2_5_VLForConditionalGeneration.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VLForConditionalGeneration.supports_encoder_tp_data", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen2_5_VLForConditionalGeneration.use_data_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VLForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VLForConditionalGeneration.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VLForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VLForConditionalGeneration.video_pruning_rate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VLForConditionalGeneration.is_multimodal_pruning_enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VLForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VLForConditionalGeneration.visual", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VLForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 62, "n_typed": 51, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 21, "n_method_overloads": 21, "n_method_params": 31, "n_attrs": 12, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_5_vl.Qwen2_5_VLVideoEmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen2_5_VLVideoEmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VLVideoEmbeddingInputs.video_embeds", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VLVideoEmbeddingInputs.video_grid_thw", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VLVideoEmbeddingInputs.second_per_grid_ts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VLVideoEmbeddingInputs.timestamps", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_5_vl.Qwen2_5_VisionPatchMerger", "methods": [ { "kind": "function", "name": "Qwen2_5_VisionPatchMerger.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Qwen2_5_VisionPatchMerger.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen2_5_VisionPatchMerger.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VisionPatchMerger.ln_q", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VisionPatchMerger.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 9, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_5_vl.Qwen2_5_VisionPatchEmbed", "methods": [ { "kind": "function", "name": "Qwen2_5_VisionPatchEmbed.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Qwen2_5_VisionPatchEmbed.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen2_5_VisionPatchEmbed.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VisionPatchEmbed.temporal_patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VisionPatchEmbed.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VisionPatchEmbed.proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 7, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_5_vl.Qwen2_5_VLProcessingInfo", "methods": [ { "kind": "function", "name": "Qwen2_5_VLProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Qwen2_5_VLProcessingInfo.get_hf_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_5_vl.Qwen2_5_VisionTransformer", "methods": [ { "kind": "function", "name": "Qwen2_5_VisionTransformer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Qwen2_5_VisionTransformer.rotary_pos_emb_thw", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Qwen2_5_VisionTransformer.get_window_index_thw", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Qwen2_5_VisionTransformer.get_rope_by_thw", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Qwen2_5_VisionTransformer.compute_attn_mask_seqlen", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2_5_VisionTransformer.invert_permutation", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2_5_VisionTransformer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen2_5_VisionTransformer.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "Qwen2_5_VisionTransformer.dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Qwen2_5_VisionTransformer.device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "Qwen2_5_VisionTransformer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VisionTransformer.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VisionTransformer.out_hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VisionTransformer.window_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VisionTransformer.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VisionTransformer.spatial_merge_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VisionTransformer.fullatt_block_indexes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VisionTransformer.spatial_merge_unit", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VisionTransformer.rotary_pos_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VisionTransformer.attn_backend", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VisionTransformer.patch_embed", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VisionTransformer.blocks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VisionTransformer.merger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 41, "n_typed": 16, "n_any": 0, "n_untyped": 25, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 18, "n_attrs": 13, "n_properties": 2 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_5_vl.Qwen2_5_VLMultiModalProcessor", "methods": [ { "kind": "function", "name": "Qwen2_5_VLMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen2_5_VLMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_5_vl.Qwen2_5_VisionBlock", "methods": [ { "kind": "function", "name": "Qwen2_5_VisionBlock.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "Qwen2_5_VisionBlock.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen2_5_VisionBlock.norm1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VisionBlock.norm2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VisionBlock.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VisionBlock.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 14, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 12, "n_attrs": 4, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.qwen2_5_vl.Qwen2_5_VLImageInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_5_vl.Qwen2_5_VisionMLP", "methods": [ { "kind": "function", "name": "Qwen2_5_VisionMLP.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Qwen2_5_VisionMLP.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen2_5_VisionMLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VisionMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2_5_VisionMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.qwen2_5_vl.Qwen2_5_VLVideoInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.models.qwen2_5_vl", "names": [ "vllm.model_executor.models.qwen2_5_vl.Qwen2_5_VLForConditionalGeneration", "vllm.model_executor.models.qwen2_5_vl.Qwen2_5_VLImageEmbeddingInputs", "vllm.model_executor.models.qwen2_5_vl.Qwen2_5_VLImageInputs", "vllm.model_executor.models.qwen2_5_vl.Qwen2_5_VLImagePixelInputs", "vllm.model_executor.models.qwen2_5_vl.Qwen2_5_VLMultiModalProcessor", "vllm.model_executor.models.qwen2_5_vl.Qwen2_5_VLProcessingInfo", "vllm.model_executor.models.qwen2_5_vl.Qwen2_5_VLVideoEmbeddingInputs", "vllm.model_executor.models.qwen2_5_vl.Qwen2_5_VLVideoInputs", "vllm.model_executor.models.qwen2_5_vl.Qwen2_5_VLVideoPixelInputs", "vllm.model_executor.models.qwen2_5_vl.Qwen2_5_VisionAttention", "vllm.model_executor.models.qwen2_5_vl.Qwen2_5_VisionBlock", "vllm.model_executor.models.qwen2_5_vl.Qwen2_5_VisionMLP", "vllm.model_executor.models.qwen2_5_vl.Qwen2_5_VisionPatchEmbed", "vllm.model_executor.models.qwen2_5_vl.Qwen2_5_VisionPatchMerger", "vllm.model_executor.models.qwen2_5_vl.Qwen2_5_VisionTransformer", "vllm.model_executor.models.qwen2_5_vl.logger" ], "n_typable": 206, "n_typed": 144, "n_any": 0, "n_untyped": 62, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 43, "n_method_overloads": 43, "n_method_params": 97, "n_classes": 13, "n_attrs": 66, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/qwen2_audio.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.qwen2_audio.Qwen2AudioMultiModalProcessor", "methods": [ { "kind": "function", "name": "Qwen2AudioMultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Qwen2AudioMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen2AudioMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_audio.Qwen2AudioMultiModalDataParser", "methods": [ { "kind": "function", "name": "Qwen2AudioMultiModalDataParser._parse_audio_data", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_audio.Qwen2AudioProcessingInfo", "methods": [ { "kind": "function", "name": "Qwen2AudioProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Qwen2AudioProcessingInfo.get_hf_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2AudioProcessingInfo.get_feature_extractor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2AudioProcessingInfo.get_data_parser", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Qwen2AudioProcessingInfo.get_target_channels", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Qwen2AudioProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Qwen2AudioProcessingInfo.get_mm_max_tokens_per_item", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 11, "n_typed": 9, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.qwen2_audio.Qwen2AudioInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_audio.Qwen2AudioEmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen2AudioEmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2AudioEmbeddingInputs.audio_embeds", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_audio.Qwen2AudioDummyInputsBuilder", "methods": [ { "kind": "function", "name": "Qwen2AudioDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2AudioDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_audio.Qwen2AudioMultiModalProjector", "methods": [ { "kind": "function", "name": "Qwen2AudioMultiModalProjector.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen2AudioMultiModalProjector.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen2AudioMultiModalProjector.linear", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 6, "n_typed": 2, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_audio.Qwen2AudioFeatureInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen2AudioFeatureInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2AudioFeatureInputs.input_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2AudioFeatureInputs.feature_attention_mask", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_audio.Qwen2AudioForConditionalGeneration", "methods": [ { "kind": "function", "name": "Qwen2AudioForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen2AudioForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen2AudioForConditionalGeneration._parse_and_validate_audio_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2AudioForConditionalGeneration._process_audio_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2AudioForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2AudioForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Qwen2AudioForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2AudioForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen2AudioForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2AudioForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2AudioForConditionalGeneration.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2AudioForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2AudioForConditionalGeneration.audio_tower", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2AudioForConditionalGeneration.multi_modal_projector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2AudioForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 29, "n_typed": 21, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 14, "n_attrs": 7, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.qwen2_audio", "names": [ "vllm.model_executor.models.qwen2_audio.Qwen2AudioDummyInputsBuilder", "vllm.model_executor.models.qwen2_audio.Qwen2AudioEmbeddingInputs", "vllm.model_executor.models.qwen2_audio.Qwen2AudioFeatureInputs", "vllm.model_executor.models.qwen2_audio.Qwen2AudioForConditionalGeneration", "vllm.model_executor.models.qwen2_audio.Qwen2AudioInputs", "vllm.model_executor.models.qwen2_audio.Qwen2AudioMultiModalDataParser", "vllm.model_executor.models.qwen2_audio.Qwen2AudioMultiModalProcessor", "vllm.model_executor.models.qwen2_audio.Qwen2AudioMultiModalProjector", "vllm.model_executor.models.qwen2_audio.Qwen2AudioProcessingInfo" ], "n_typable": 72, "n_typed": 58, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 23, "n_method_overloads": 23, "n_method_params": 35, "n_classes": 8, "n_attrs": 14, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/qwen2_moe.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.qwen2_moe.Qwen2MoeModel", "methods": [ { "kind": "function", "name": "Qwen2MoeModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen2MoeModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2MoeModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Qwen2MoeModel.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Qwen2MoeModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen2MoeModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2MoeModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2MoeModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2MoeModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2MoeModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 12, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 8, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_moe.Qwen2MoeMLP", "methods": [ { "kind": "function", "name": "Qwen2MoeMLP.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "Qwen2MoeMLP.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen2MoeMLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2MoeMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2MoeMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2MoeMLP.expert_gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 8, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_moe.Qwen2MoeDecoderLayer", "methods": [ { "kind": "function", "name": "Qwen2MoeDecoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Qwen2MoeDecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen2MoeDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2MoeDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2MoeDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2MoeDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2MoeDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 9, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_moe.Qwen2MoeSparseMoeBlock", "methods": [ { "kind": "function", "name": "Qwen2MoeSparseMoeBlock.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Qwen2MoeSparseMoeBlock.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen2MoeSparseMoeBlock.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2MoeSparseMoeBlock.gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2MoeSparseMoeBlock.shared_expert_gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2MoeSparseMoeBlock.experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2MoeSparseMoeBlock.shared_expert", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 5, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 5, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.qwen2_moe.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_moe.Qwen2MoeForCausalLM", "methods": [ { "kind": "function", "name": "Qwen2MoeForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen2MoeForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2MoeForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Qwen2MoeForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2MoeForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2MoeForCausalLM.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen2MoeForCausalLM.fall_back_to_pt_during_load", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen2MoeForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen2MoeForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2MoeForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2MoeForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2MoeForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2MoeForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2MoeForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 14, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 9, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_moe.Qwen2MoeAttention", "methods": [ { "kind": "function", "name": "Qwen2MoeAttention.__init__", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "Qwen2MoeAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen2MoeAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2MoeAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2MoeAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2MoeAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2MoeAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2MoeAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2MoeAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2MoeAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2MoeAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2MoeAttention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2MoeAttention.dual_chunk_attention_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2MoeAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2MoeAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2MoeAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2MoeAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 28, "n_typed": 13, "n_any": 0, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 11, "n_attrs": 15, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.qwen2_moe", "names": [ "vllm.model_executor.models.qwen2_moe.Qwen2MoeAttention", "vllm.model_executor.models.qwen2_moe.Qwen2MoeDecoderLayer", "vllm.model_executor.models.qwen2_moe.Qwen2MoeForCausalLM", "vllm.model_executor.models.qwen2_moe.Qwen2MoeMLP", "vllm.model_executor.models.qwen2_moe.Qwen2MoeModel", "vllm.model_executor.models.qwen2_moe.Qwen2MoeSparseMoeBlock", "vllm.model_executor.models.qwen2_moe.logger" ], "n_typable": 107, "n_typed": 61, "n_any": 0, "n_untyped": 46, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 19, "n_method_overloads": 19, "n_method_params": 47, "n_classes": 6, "n_attrs": 43, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/qwen2_rm.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.qwen2_rm.Qwen2RewardBaseModel", "methods": [ { "kind": "function", "name": "Qwen2RewardBaseModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen2RewardBaseModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2RewardBaseModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Qwen2RewardBaseModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen2RewardBaseModel.is_pooling_model", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen2RewardBaseModel.pooler", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2RewardBaseModel.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen2RewardBaseModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2RewardBaseModel.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2RewardBaseModel.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2RewardBaseModel.head_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2RewardBaseModel.score", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2RewardBaseModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 12, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_rm.Qwen2ForProcessRewardModel", "methods": [ { "kind": "function", "name": "Qwen2ForProcessRewardModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_rm.Qwen2ForRewardModel", "methods": [ { "kind": "function", "name": "Qwen2ForRewardModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.qwen2_rm", "names": [ "vllm.model_executor.models.qwen2_rm.Qwen2ForProcessRewardModel", "vllm.model_executor.models.qwen2_rm.Qwen2ForRewardModel", "vllm.model_executor.models.qwen2_rm.Qwen2RewardBaseModel" ], "n_typable": 25, "n_typed": 16, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 12, "n_classes": 3, "n_attrs": 9, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/qwen2_vl.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.qwen2_vl.Qwen2VLMultiModalDataParser", "methods": [ { "kind": "function", "name": "Qwen2VLMultiModalDataParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Qwen2VLMultiModalDataParser._parse_image_data", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2VLMultiModalDataParser._parse_video_data", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 8, "n_typed": 5, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_vl.Tarsier2Processor", "methods": [ { "kind": "function", "name": "Tarsier2Processor.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [], "n_typable": 5, "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_vl.Qwen2VLVideoPixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen2VLVideoPixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2VLVideoPixelInputs.pixel_values_videos", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2VLVideoPixelInputs.video_grid_thw", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_vl.Qwen2VLForConditionalGeneration", "methods": [ { "kind": "function", "name": "Qwen2VLForConditionalGeneration.iter_mm_grid_thw", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2VLForConditionalGeneration.get_mrope_input_positions", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen2VLForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen2VLForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen2VLForConditionalGeneration._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2VLForConditionalGeneration._parse_and_validate_video_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2VLForConditionalGeneration._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2VLForConditionalGeneration._process_video_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2VLForConditionalGeneration._parse_and_validate_multimodal_inputs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2VLForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2VLForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Qwen2VLForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2VLForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2VLForConditionalGeneration.get_mm_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Qwen2VLForConditionalGeneration.get_num_mm_encoder_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2VLForConditionalGeneration.get_num_mm_connector_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen2VLForConditionalGeneration.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2VLForConditionalGeneration.supports_encoder_tp_data", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen2VLForConditionalGeneration.use_data_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2VLForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2VLForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2VLForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2VLForConditionalGeneration.visual", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2VLForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 45, "n_typed": 37, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 16, "n_method_overloads": 16, "n_method_params": 22, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_vl.Tarsier2ProcessingInfo", "methods": [ { "kind": "function", "name": "Tarsier2ProcessingInfo.get_hf_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Tarsier2ProcessingInfo.get_hf_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Tarsier2ProcessingInfo.get_image_processor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_vl.Tarsier2MultiModalProcessor", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_vl.Qwen2VLImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen2VLImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2VLImagePixelInputs.pixel_values", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2VLImagePixelInputs.image_grid_thw", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_vl.Qwen2VisionMLP", "methods": [ { "kind": "function", "name": "Qwen2VisionMLP.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Qwen2VisionMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen2VisionMLP.fc1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2VisionMLP.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2VisionMLP.fc2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 7, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_vl.Qwen2VLMultiModalProcessor", "methods": [ { "kind": "function", "name": "Qwen2VLMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Qwen2VLMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_vl.Qwen2VLImageEmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen2VLImageEmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2VLImageEmbeddingInputs.image_embeds", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2VLImageEmbeddingInputs.image_grid_thw", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_vl.Qwen2VisionTransformer", "methods": [ { "kind": "function", "name": "Qwen2VisionTransformer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Qwen2VisionTransformer.rot_pos_emb", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2VisionTransformer.compute_attn_mask_seqlen", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2VisionTransformer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen2VisionTransformer.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "Qwen2VisionTransformer.dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Qwen2VisionTransformer.device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "Qwen2VisionTransformer.use_data_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2VisionTransformer.out_hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2VisionTransformer.spatial_merge_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2VisionTransformer.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2VisionTransformer.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2VisionTransformer.patch_embed", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2VisionTransformer.rotary_pos_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2VisionTransformer.blocks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2VisionTransformer.merger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2VisionTransformer.attn_backend", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 26, "n_typed": 16, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 10, "n_properties": 2 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_vl.Qwen2VLVideoEmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen2VLVideoEmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2VLVideoEmbeddingInputs.video_embeds", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2VLVideoEmbeddingInputs.video_grid_thw", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_vl.Qwen2VLDummyInputsBuilder", "methods": [ { "kind": "function", "name": "Qwen2VLDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2VLDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_vl.Qwen2VisionAttention", "methods": [ { "kind": "function", "name": "Qwen2VisionAttention.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Qwen2VisionAttention.split_qkv", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2VisionAttention.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen2VisionAttention.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2VisionAttention.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2VisionAttention.hidden_size_per_attention_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2VisionAttention.num_attention_heads_per_partition", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2VisionAttention.qkv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2VisionAttention.proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2VisionAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2VisionAttention.apply_rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 14, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 11, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_vl.Qwen2VisionPatchMerger", "methods": [ { "kind": "function", "name": "Qwen2VisionPatchMerger.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Qwen2VisionPatchMerger.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen2VisionPatchMerger.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2VisionPatchMerger.ln_q", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2VisionPatchMerger.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 9, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_vl.Qwen2VisionPatchEmbed", "methods": [ { "kind": "function", "name": "Qwen2VisionPatchEmbed.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Qwen2VisionPatchEmbed.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen2VisionPatchEmbed.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2VisionPatchEmbed.temporal_patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2VisionPatchEmbed.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2VisionPatchEmbed.proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 7, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 4, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.qwen2_vl.Qwen2VLImageInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.models.qwen2_vl.Qwen2VLVideoInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_vl.Tarsier2ImageProcessor", "methods": [ { "kind": "function", "name": "Tarsier2ImageProcessor.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_vl.Tarsier2ForConditionalGeneration", "methods": [ { "kind": "function", "name": "Tarsier2ForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Tarsier2ForConditionalGeneration.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_vl.Qwen2VisionBlock", "methods": [ { "kind": "function", "name": "Qwen2VisionBlock.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "Qwen2VisionBlock.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen2VisionBlock.norm1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2VisionBlock.norm2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2VisionBlock.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen2VisionBlock.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 14, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 12, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen2_vl.Qwen2VLProcessingInfo", "methods": [ { "kind": "function", "name": "Qwen2VLProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Qwen2VLProcessingInfo.get_hf_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2VLProcessingInfo.get_image_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2VLProcessingInfo.get_data_parser", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Qwen2VLProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Qwen2VLProcessingInfo.get_mm_max_tokens_per_item", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen2VLProcessingInfo._get_vision_info", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Qwen2VLProcessingInfo.get_num_image_tokens", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Qwen2VLProcessingInfo.get_num_video_tokens", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Qwen2VLProcessingInfo.get_image_size_with_most_features", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen2VLProcessingInfo.get_max_image_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Qwen2VLProcessingInfo._get_max_video_frames", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen2VLProcessingInfo.get_num_frames_with_most_features", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Qwen2VLProcessingInfo.get_max_video_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 41, "n_typed": 39, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 27, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.qwen2_vl.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.models.qwen2_vl", "names": [ "vllm.model_executor.models.qwen2_vl.Qwen2VLDummyInputsBuilder", "vllm.model_executor.models.qwen2_vl.Qwen2VLForConditionalGeneration", "vllm.model_executor.models.qwen2_vl.Qwen2VLImageEmbeddingInputs", "vllm.model_executor.models.qwen2_vl.Qwen2VLImageInputs", "vllm.model_executor.models.qwen2_vl.Qwen2VLImagePixelInputs", "vllm.model_executor.models.qwen2_vl.Qwen2VLMultiModalDataParser", "vllm.model_executor.models.qwen2_vl.Qwen2VLMultiModalProcessor", "vllm.model_executor.models.qwen2_vl.Qwen2VLProcessingInfo", "vllm.model_executor.models.qwen2_vl.Qwen2VLVideoEmbeddingInputs", "vllm.model_executor.models.qwen2_vl.Qwen2VLVideoInputs", "vllm.model_executor.models.qwen2_vl.Qwen2VLVideoPixelInputs", "vllm.model_executor.models.qwen2_vl.Qwen2VisionAttention", "vllm.model_executor.models.qwen2_vl.Qwen2VisionBlock", "vllm.model_executor.models.qwen2_vl.Qwen2VisionMLP", "vllm.model_executor.models.qwen2_vl.Qwen2VisionPatchEmbed", "vllm.model_executor.models.qwen2_vl.Qwen2VisionPatchMerger", "vllm.model_executor.models.qwen2_vl.Qwen2VisionTransformer", "vllm.model_executor.models.qwen2_vl.Tarsier2ForConditionalGeneration", "vllm.model_executor.models.qwen2_vl.Tarsier2ImageProcessor", "vllm.model_executor.models.qwen2_vl.Tarsier2MultiModalProcessor", "vllm.model_executor.models.qwen2_vl.Tarsier2ProcessingInfo", "vllm.model_executor.models.qwen2_vl.Tarsier2Processor", "vllm.model_executor.models.qwen2_vl.logger" ], "n_typable": 237, "n_typed": 186, "n_any": 0, "n_untyped": 51, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 59, "n_method_overloads": 59, "n_method_params": 121, "n_classes": 20, "n_attrs": 56, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/qwen3.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.qwen3.Qwen3Model", "methods": [ { "kind": "function", "name": "Qwen3Model.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.qwen3.ALL_DECODER_LAYER_TYPES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3.Qwen3ForCausalLM", "methods": [ { "kind": "function", "name": "Qwen3ForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3ForCausalLM.set_aux_hidden_state_layers", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3ForCausalLM.get_eagle3_aux_hidden_state_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Qwen3ForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3ForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Qwen3ForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3ForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3ForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3ForCausalLM.embedding_modules", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3ForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3ForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3ForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3ForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3ForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3ForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 23, "n_typed": 16, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 10, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3.Qwen3Attention", "methods": [ { "kind": "function", "name": "Qwen3Attention.__init__", "n_typed": 14, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 }, { "kind": "function", "name": "Qwen3Attention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3Attention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3Attention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3Attention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3Attention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3Attention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3Attention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3Attention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3Attention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3Attention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3Attention.dual_chunk_attention_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3Attention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3Attention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3Attention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3Attention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3Attention.q_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3Attention.k_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 33, "n_typed": 17, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 15, "n_attrs": 16, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3.Qwen3DecoderLayer", "methods": [ { "kind": "function", "name": "Qwen3DecoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Qwen3DecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3DecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3DecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3DecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3DecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3DecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 9, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 5, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.qwen3.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.models.qwen3", "names": [ "vllm.model_executor.models.qwen3.ALL_DECODER_LAYER_TYPES", "vllm.model_executor.models.qwen3.Qwen3Attention", "vllm.model_executor.models.qwen3.Qwen3DecoderLayer", "vllm.model_executor.models.qwen3.Qwen3ForCausalLM", "vllm.model_executor.models.qwen3.Qwen3Model", "vllm.model_executor.models.qwen3.logger" ], "n_typable": 74, "n_typed": 44, "n_any": 0, "n_untyped": 30, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 34, "n_classes": 4, "n_attrs": 31, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/qwen3_5.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.models.qwen3_5.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_5.Qwen3_5ForCausalLM", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_5.Qwen3_5ProcessingInfo", "methods": [ { "kind": "function", "name": "Qwen3_5ProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_5.Qwen3_5ForConditionalGeneration", "methods": [ { "kind": "function", "name": "Qwen3_5ForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3_5ForConditionalGeneration.embed_input_ids", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Qwen3_5ForConditionalGeneration.recompute_mrope_positions", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3_5ForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Qwen3_5ForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3_5ForConditionalGeneration.get_mamba_state_dtype_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3_5ForConditionalGeneration.get_mamba_state_shape_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3_5ForConditionalGeneration.get_mamba_state_copy_func", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3_5ForConditionalGeneration.supports_multimodal_pruning", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3_5ForConditionalGeneration.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3_5ForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5ForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5ForConditionalGeneration.use_data_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5ForConditionalGeneration.is_multimodal_pruning_enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5ForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5ForConditionalGeneration.visual", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5ForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 31, "n_typed": 20, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 16, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_5.Qwen3_5Model", "methods": [ { "kind": "function", "name": "Qwen3_5Model.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3_5Model.load_fused_expert_weights", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Qwen3_5Model.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3_5Model.num_redundant_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5Model.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5Model.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5Model.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5Model.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5Model.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 10, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 8, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_5.Qwen3_5MoeForCausalLM", "methods": [ { "kind": "function", "name": "Qwen3_5MoeForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3_5MoeForCausalLM.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_5.Qwen3_5GatedDeltaNet", "methods": [ { "kind": "function", "name": "Qwen3_5GatedDeltaNet.fix_query_key_value_ordering", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3_5GatedDeltaNet.create_qkvz_proj", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Qwen3_5GatedDeltaNet.forward", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 10, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_5.Qwen3_5_MoeMixtureOfExperts", "methods": [ { "kind": "function", "name": "Qwen3_5_MoeMixtureOfExperts.update_physical_experts_metadata", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3_5_MoeMixtureOfExperts.set_moe_parameters", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_5.Qwen3_5ForCausalLMBase", "methods": [ { "kind": "function", "name": "Qwen3_5ForCausalLMBase.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3_5ForCausalLMBase.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3_5ForCausalLMBase.forward", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Qwen3_5ForCausalLMBase.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3_5ForCausalLMBase.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3_5ForCausalLMBase.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3_5ForCausalLMBase.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5ForCausalLMBase.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5ForCausalLMBase.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5ForCausalLMBase.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5ForCausalLMBase.scheduler_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5ForCausalLMBase.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5ForCausalLMBase.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5ForCausalLMBase.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5ForCausalLMBase.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 24, "n_typed": 13, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 10, "n_attrs": 10, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_5.Qwen3_5DecoderLayer", "methods": [ { "kind": "function", "name": "Qwen3_5DecoderLayer.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3_5DecoderLayer.layer_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5DecoderLayer.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5DecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5DecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5DecoderLayer.layer_scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5DecoderLayer.linear_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5DecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5DecoderLayer.attn_layer_scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5DecoderLayer.ffn_layer_scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5DecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 4, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 3, "n_attrs": 10, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_5.Qwen3_5MoeProcessingInfo", "methods": [ { "kind": "function", "name": "Qwen3_5MoeProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_5.Qwen3_5MoeForConditionalGeneration", "methods": [ { "kind": "function", "name": "Qwen3_5MoeForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3_5MoeForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeForConditionalGeneration.use_data_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeForConditionalGeneration.is_multimodal_pruning_enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeForConditionalGeneration.visual", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 2, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 7, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.qwen3_5", "names": [ "vllm.model_executor.models.qwen3_5.Qwen3_5DecoderLayer", "vllm.model_executor.models.qwen3_5.Qwen3_5ForCausalLM", "vllm.model_executor.models.qwen3_5.Qwen3_5ForCausalLMBase", "vllm.model_executor.models.qwen3_5.Qwen3_5ForConditionalGeneration", "vllm.model_executor.models.qwen3_5.Qwen3_5GatedDeltaNet", "vllm.model_executor.models.qwen3_5.Qwen3_5Model", "vllm.model_executor.models.qwen3_5.Qwen3_5MoeForCausalLM", "vllm.model_executor.models.qwen3_5.Qwen3_5MoeForConditionalGeneration", "vllm.model_executor.models.qwen3_5.Qwen3_5MoeProcessingInfo", "vllm.model_executor.models.qwen3_5.Qwen3_5ProcessingInfo", "vllm.model_executor.models.qwen3_5.Qwen3_5_MoeMixtureOfExperts", "vllm.model_executor.models.qwen3_5.logger" ], "n_typable": 119, "n_typed": 65, "n_any": 0, "n_untyped": 54, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 27, "n_method_overloads": 27, "n_method_params": 52, "n_classes": 11, "n_attrs": 43, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/qwen3_5_mtp.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.qwen3_5_mtp.Qwen3_5MoeMTP", "methods": [ { "kind": "function", "name": "Qwen3_5MoeMTP.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.qwen3_5_mtp.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_5_mtp.Qwen3_5MultiTokenPredictor", "methods": [ { "kind": "function", "name": "Qwen3_5MultiTokenPredictor.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3_5MultiTokenPredictor.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3_5MultiTokenPredictor.forward", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Qwen3_5MultiTokenPredictor.load_fused_expert_weights", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Qwen3_5MultiTokenPredictor.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3_5MultiTokenPredictor.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MultiTokenPredictor.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MultiTokenPredictor.mtp_start_layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MultiTokenPredictor.num_mtp_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MultiTokenPredictor.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MultiTokenPredictor.fc", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MultiTokenPredictor.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MultiTokenPredictor.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MultiTokenPredictor.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MultiTokenPredictor.pre_fc_norm_hidden", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MultiTokenPredictor.pre_fc_norm_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 31, "n_typed": 19, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 15, "n_attrs": 11, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_5_mtp.Qwen3_5MTP", "methods": [ { "kind": "function", "name": "Qwen3_5MTP.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3_5MTP.embed_input_ids", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Qwen3_5MTP.forward", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Qwen3_5MTP.compute_logits", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3_5MTP.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3_5MTP.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3_5MTP.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MTP.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MTP.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MTP.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MTP.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MTP.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 26, "n_typed": 18, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 15, "n_attrs": 7, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.qwen3_5_mtp", "names": [ "vllm.model_executor.models.qwen3_5_mtp.Qwen3_5MTP", "vllm.model_executor.models.qwen3_5_mtp.Qwen3_5MoeMTP", "vllm.model_executor.models.qwen3_5_mtp.Qwen3_5MultiTokenPredictor", "vllm.model_executor.models.qwen3_5_mtp.logger" ], "n_typable": 61, "n_typed": 39, "n_any": 0, "n_untyped": 22, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 32, "n_classes": 3, "n_attrs": 19, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/qwen3_asr.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.qwen3_asr.Qwen3ASRDummyInputsBuilder", "methods": [ { "kind": "function", "name": "Qwen3ASRDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3ASRDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_asr.Qwen3ASRProcessingInfo", "methods": [ { "kind": "function", "name": "Qwen3ASRProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Qwen3ASRProcessingInfo.get_hf_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3ASRProcessingInfo.get_feature_extractor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3ASRProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Qwen3ASRProcessingInfo.get_data_parser", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_asr.Qwen3ASRMultiModalDataParser", "methods": [ { "kind": "function", "name": "Qwen3ASRMultiModalDataParser._parse_audio_data", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_asr.Qwen3ASRForConditionalGeneration", "methods": [ { "kind": "function", "name": "Qwen3ASRForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3ASRForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3ASRForConditionalGeneration._parse_and_validate_audio_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3ASRForConditionalGeneration._parse_and_validate_multimodal_inputs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3ASRForConditionalGeneration._process_audio_input", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Qwen3ASRForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3ASRForConditionalGeneration.embed_input_ids", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Qwen3ASRForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Qwen3ASRForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3ASRForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3ASRForConditionalGeneration.get_mrope_input_positions", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3ASRForConditionalGeneration.get_mm_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Qwen3ASRForConditionalGeneration.get_speech_to_text_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3ASRForConditionalGeneration.get_generation_prompt", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "Qwen3ASRForConditionalGeneration.post_process_output", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3ASRForConditionalGeneration.supported_languages", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3ASRForConditionalGeneration.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3ASRForConditionalGeneration.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3ASRForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3ASRForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3ASRForConditionalGeneration.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3ASRForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3ASRForConditionalGeneration.audio_tower", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3ASRForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 56, "n_typed": 47, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 33, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_asr.Qwen3ASRMultiModalProcessor", "methods": [ { "kind": "function", "name": "Qwen3ASRMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3ASRMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.qwen3_asr.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.models.qwen3_asr", "names": [ "vllm.model_executor.models.qwen3_asr.Qwen3ASRDummyInputsBuilder", "vllm.model_executor.models.qwen3_asr.Qwen3ASRForConditionalGeneration", "vllm.model_executor.models.qwen3_asr.Qwen3ASRMultiModalDataParser", "vllm.model_executor.models.qwen3_asr.Qwen3ASRMultiModalProcessor", "vllm.model_executor.models.qwen3_asr.Qwen3ASRProcessingInfo", "vllm.model_executor.models.qwen3_asr.logger" ], "n_typable": 79, "n_typed": 68, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 25, "n_method_overloads": 25, "n_method_params": 45, "n_classes": 5, "n_attrs": 10, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/qwen3_asr_realtime.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.qwen3_asr_realtime.Qwen3ASRRealtimeMultiModalProcessor", "methods": [ { "kind": "function", "name": "Qwen3ASRRealtimeMultiModalProcessor.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Qwen3ASRRealtimeMultiModalProcessor._maybe_apply_prompt_updates", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [], "n_typable": 10, "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_asr_realtime.Qwen3ASRRealtimeGeneration", "methods": [ { "kind": "function", "name": "Qwen3ASRRealtimeGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3ASRRealtimeGeneration.buffer_realtime_audio", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Qwen3ASRRealtimeGeneration.get_speech_to_text_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3ASRRealtimeGeneration.realtime_max_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 10, "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_asr_realtime.Qwen3ASRRealtimeBuffer", "methods": [ { "kind": "function", "name": "Qwen3ASRRealtimeBuffer.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3ASRRealtimeBuffer.write_audio", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3ASRRealtimeBuffer.read_audio", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Qwen3ASRRealtimeBuffer.flush", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.qwen3_asr_realtime.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.models.qwen3_asr_realtime", "names": [ "vllm.model_executor.models.qwen3_asr_realtime.Qwen3ASRRealtimeBuffer", "vllm.model_executor.models.qwen3_asr_realtime.Qwen3ASRRealtimeGeneration", "vllm.model_executor.models.qwen3_asr_realtime.Qwen3ASRRealtimeMultiModalProcessor", "vllm.model_executor.models.qwen3_asr_realtime.logger" ], "n_typable": 28, "n_typed": 25, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 18, "n_classes": 3, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/qwen3_moe.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.qwen3_moe.Qwen3MoeAttention", "methods": [ { "kind": "function", "name": "Qwen3MoeAttention.__init__", "n_typed": 13, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 }, { "kind": "function", "name": "Qwen3MoeAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3MoeAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeAttention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeAttention.dual_chunk_attention_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeAttention.q_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeAttention.k_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 33, "n_typed": 16, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 14, "n_attrs": 17, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_moe.Qwen3MoeDecoderLayer", "methods": [ { "kind": "function", "name": "Qwen3MoeDecoderLayer.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3MoeDecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3MoeDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_moe.Qwen3MoeSparseMoeBlock", "methods": [ { "kind": "function", "name": "Qwen3MoeSparseMoeBlock.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3MoeSparseMoeBlock.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3MoeSparseMoeBlock.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeSparseMoeBlock.ep_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeSparseMoeBlock.ep_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeSparseMoeBlock.ep_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeSparseMoeBlock.n_routed_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeSparseMoeBlock.is_sequence_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeSparseMoeBlock.enable_eplb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeSparseMoeBlock.n_logical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeSparseMoeBlock.n_redundant_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeSparseMoeBlock.n_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeSparseMoeBlock.n_local_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeSparseMoeBlock.physical_expert_start", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeSparseMoeBlock.physical_expert_end", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeSparseMoeBlock.gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeSparseMoeBlock.experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeSparseMoeBlock.shared_expert_gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeSparseMoeBlock.shared_expert", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 4, "n_any": 0, "n_untyped": 18, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 17, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_moe.Qwen3MoeMLP", "methods": [ { "kind": "function", "name": "Qwen3MoeMLP.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "Qwen3MoeMLP.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3MoeMLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeMLP.expert_gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 8, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_moe.Qwen3MoeForCausalLM", "methods": [ { "kind": "function", "name": "Qwen3MoeForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3MoeForCausalLM.update_physical_experts_metadata", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3MoeForCausalLM.set_aux_hidden_state_layers", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3MoeForCausalLM.get_eagle3_aux_hidden_state_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Qwen3MoeForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3MoeForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Qwen3MoeForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3MoeForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3MoeForCausalLM.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3MoeForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3MoeForCausalLM.embedding_modules", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3MoeForCausalLM.fall_back_to_pt_during_load", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3MoeForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeForCausalLM.expert_weights", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeForCausalLM.moe_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeForCausalLM.num_moe_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeForCausalLM.num_expert_groups", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeForCausalLM.num_shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeForCausalLM.num_logical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeForCausalLM.num_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeForCausalLM.num_local_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeForCausalLM.num_routed_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeForCausalLM.num_redundant_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 37, "n_typed": 20, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 12, "n_attrs": 19, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.qwen3_moe.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_moe.Qwen3MoeModel", "methods": [ { "kind": "function", "name": "Qwen3MoeModel.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Qwen3MoeModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3MoeModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Qwen3MoeModel.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Qwen3MoeModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3MoeModel.num_redundant_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeModel.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeModel.aux_hidden_state_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 22, "n_typed": 14, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 8, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.qwen3_moe", "names": [ "vllm.model_executor.models.qwen3_moe.Qwen3MoeAttention", "vllm.model_executor.models.qwen3_moe.Qwen3MoeDecoderLayer", "vllm.model_executor.models.qwen3_moe.Qwen3MoeForCausalLM", "vllm.model_executor.models.qwen3_moe.Qwen3MoeMLP", "vllm.model_executor.models.qwen3_moe.Qwen3MoeModel", "vllm.model_executor.models.qwen3_moe.Qwen3MoeSparseMoeBlock", "vllm.model_executor.models.qwen3_moe.logger" ], "n_typable": 141, "n_typed": 69, "n_any": 0, "n_untyped": 72, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 22, "n_method_overloads": 22, "n_method_params": 51, "n_classes": 6, "n_attrs": 71, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/qwen3_next.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.models.qwen3_next.fused_gdn_gating_kernel", "n_typed": 4, "n_any": 0, "n_untyped": 8, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "vllm.model_executor.models.qwen3_next.gdn_attention_core_fake", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_next.ChunkGatedDeltaRule", "methods": [ { "kind": "function", "name": "ChunkGatedDeltaRule.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ChunkGatedDeltaRule.forward_cuda", "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "ChunkGatedDeltaRule.forward_native", "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 } ], "properties": [], "attrs": [], "n_typable": 21, "n_typed": 19, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 18, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_next.Qwen3NextSparseMoeBlock", "methods": [ { "kind": "function", "name": "Qwen3NextSparseMoeBlock.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3NextSparseMoeBlock.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3NextSparseMoeBlock.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextSparseMoeBlock.ep_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextSparseMoeBlock.ep_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextSparseMoeBlock.ep_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextSparseMoeBlock.n_routed_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextSparseMoeBlock.is_sequence_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextSparseMoeBlock.enable_eplb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextSparseMoeBlock.n_logical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextSparseMoeBlock.n_redundant_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextSparseMoeBlock.n_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextSparseMoeBlock.n_local_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextSparseMoeBlock.physical_expert_start", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextSparseMoeBlock.physical_expert_end", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextSparseMoeBlock.gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextSparseMoeBlock.shared_expert_gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextSparseMoeBlock.experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextSparseMoeBlock.shared_expert", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 4, "n_any": 0, "n_untyped": 18, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 17, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.qwen3_next.KVCache", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_next.Qwen3NextModel", "methods": [ { "kind": "function", "name": "Qwen3NextModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3NextModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3NextModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Qwen3NextModel.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Qwen3NextModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3NextModel.num_redundant_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 12, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 8, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_next.QwenNextMixtureOfExperts", "methods": [ { "kind": "function", "name": "QwenNextMixtureOfExperts.update_physical_experts_metadata", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "QwenNextMixtureOfExperts.set_moe_parameters", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_next.Qwen3NextGatedDeltaNet", "methods": [ { "kind": "function", "name": "Qwen3NextGatedDeltaNet.get_state_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Qwen3NextGatedDeltaNet.get_state_shape", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Qwen3NextGatedDeltaNet.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Qwen3NextGatedDeltaNet.create_qkvz_proj", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Qwen3NextGatedDeltaNet.fix_query_key_value_ordering", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3NextGatedDeltaNet.rearrange_mixed_qkv", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3NextGatedDeltaNet.forward", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3NextGatedDeltaNet._forward_core", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [ { "kind": "property", "name": "Qwen3NextGatedDeltaNet.mamba_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "Qwen3NextGatedDeltaNet.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextGatedDeltaNet.tp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextGatedDeltaNet.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextGatedDeltaNet.num_v_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextGatedDeltaNet.num_k_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextGatedDeltaNet.head_k_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextGatedDeltaNet.head_v_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextGatedDeltaNet.key_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextGatedDeltaNet.value_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextGatedDeltaNet.conv_kernel_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextGatedDeltaNet.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextGatedDeltaNet.activation", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextGatedDeltaNet.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextGatedDeltaNet.layer_norm_epsilon", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextGatedDeltaNet.prefix", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextGatedDeltaNet.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextGatedDeltaNet.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextGatedDeltaNet.cache_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextGatedDeltaNet.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextGatedDeltaNet.speculative_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextGatedDeltaNet.num_spec", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextGatedDeltaNet.conv_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextGatedDeltaNet.conv1d", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextGatedDeltaNet.in_proj_qkvz", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextGatedDeltaNet.in_proj_ba", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextGatedDeltaNet.dt_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextGatedDeltaNet.A_log", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextGatedDeltaNet.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextGatedDeltaNet.out_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextGatedDeltaNet.chunk_gated_delta_rule", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 59, "n_typed": 24, "n_any": 0, "n_untyped": 35, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 20, "n_attrs": 30, "n_properties": 1 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_next.Qwen3NextDecoderLayer", "methods": [ { "kind": "function", "name": "Qwen3NextDecoderLayer.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Qwen3NextDecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3NextDecoderLayer.layer_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextDecoderLayer.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextDecoderLayer.layer_scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextDecoderLayer.linear_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextDecoderLayer.attn_layer_scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextDecoderLayer.ffn_layer_scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 8, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 10, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_next.Qwen3NextForCausalLM", "methods": [ { "kind": "function", "name": "Qwen3NextForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3NextForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3NextForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Qwen3NextForCausalLM.get_mamba_state_dtype_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3NextForCausalLM.get_mamba_state_shape_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3NextForCausalLM.get_mamba_state_copy_func", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Qwen3NextForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3NextForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3NextForCausalLM.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3NextForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3NextForCausalLM.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextForCausalLM.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextForCausalLM.scheduler_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 30, "n_typed": 19, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 12, "n_attrs": 10, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.qwen3_next.fi_chunk_gated_delta_rule", "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "vllm.model_executor.models.qwen3_next.gdn_attention_core", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.model_executor.models.qwen3_next.fused_gdn_gating", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_next.Qwen3NextAttention", "methods": [ { "kind": "function", "name": "Qwen3NextAttention.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Qwen3NextAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3NextAttention.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextAttention.dual_chunk_attention_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextAttention.attn_output_gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextAttention.q_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextAttention.k_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 28, "n_typed": 9, "n_any": 0, "n_untyped": 19, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 18, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.qwen3_next.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.models.qwen3_next", "names": [ "vllm.model_executor.models.qwen3_next.ChunkGatedDeltaRule", "vllm.model_executor.models.qwen3_next.KVCache", "vllm.model_executor.models.qwen3_next.Qwen3NextAttention", "vllm.model_executor.models.qwen3_next.Qwen3NextDecoderLayer", "vllm.model_executor.models.qwen3_next.Qwen3NextForCausalLM", "vllm.model_executor.models.qwen3_next.Qwen3NextGatedDeltaNet", "vllm.model_executor.models.qwen3_next.Qwen3NextModel", "vllm.model_executor.models.qwen3_next.Qwen3NextSparseMoeBlock", "vllm.model_executor.models.qwen3_next.QwenNextMixtureOfExperts", "vllm.model_executor.models.qwen3_next.fi_chunk_gated_delta_rule", "vllm.model_executor.models.qwen3_next.fused_gdn_gating", "vllm.model_executor.models.qwen3_next.fused_gdn_gating_kernel", "vllm.model_executor.models.qwen3_next.gdn_attention_core", "vllm.model_executor.models.qwen3_next.gdn_attention_core_fake", "vllm.model_executor.models.qwen3_next.logger" ], "n_typable": 244, "n_typed": 130, "n_any": 0, "n_untyped": 114, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 36, "n_methods": 33, "n_method_overloads": 33, "n_method_params": 78, "n_classes": 8, "n_attrs": 93, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/qwen3_next_mtp.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.models.qwen3_next_mtp.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_next_mtp.Qwen3NextMultiTokenPredictor", "methods": [ { "kind": "function", "name": "Qwen3NextMultiTokenPredictor.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3NextMultiTokenPredictor.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3NextMultiTokenPredictor.forward", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Qwen3NextMultiTokenPredictor.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3NextMultiTokenPredictor.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextMultiTokenPredictor.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextMultiTokenPredictor.mtp_start_layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextMultiTokenPredictor.num_mtp_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextMultiTokenPredictor.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextMultiTokenPredictor.fc", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextMultiTokenPredictor.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextMultiTokenPredictor.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextMultiTokenPredictor.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextMultiTokenPredictor.pre_fc_norm_hidden", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextMultiTokenPredictor.pre_fc_norm_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 25, "n_typed": 13, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 10, "n_attrs": 11, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.qwen3_next_mtp.KVCache", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_next_mtp.Qwen3NextMTP", "methods": [ { "kind": "function", "name": "Qwen3NextMTP.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3NextMTP.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3NextMTP.forward", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Qwen3NextMTP.compute_logits", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3NextMTP.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3NextMTP.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3NextMTP.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextMTP.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextMTP.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextMTP.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextMTP.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextMTP.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 23, "n_typed": 15, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 12, "n_attrs": 7, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.qwen3_next_mtp", "names": [ "vllm.model_executor.models.qwen3_next_mtp.KVCache", "vllm.model_executor.models.qwen3_next_mtp.Qwen3NextMTP", "vllm.model_executor.models.qwen3_next_mtp.Qwen3NextMultiTokenPredictor", "vllm.model_executor.models.qwen3_next_mtp.logger" ], "n_typable": 49, "n_typed": 28, "n_any": 0, "n_untyped": 21, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 22, "n_classes": 2, "n_attrs": 20, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/qwen3_omni_moe_thinker.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.qwen3_omni_moe_thinker.Qwen3OmniMoeThinkerProcessingInfo", "methods": [ { "kind": "function", "name": "Qwen3OmniMoeThinkerProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Qwen3OmniMoeThinkerProcessingInfo.get_hf_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3OmniMoeThinkerProcessingInfo.get_feature_extractor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3OmniMoeThinkerProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Qwen3OmniMoeThinkerProcessingInfo.get_mm_max_tokens_per_item", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 7, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.qwen3_omni_moe_thinker.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_omni_moe_thinker.Qwen3MoeLLMModel", "methods": [ { "kind": "function", "name": "Qwen3MoeLLMModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3MoeLLMModel.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3MoeLLMModel.deepstack_multiscale_layer_start", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 8, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_omni_moe_thinker.SinusoidsPositionEmbedding", "methods": [ { "kind": "function", "name": "SinusoidsPositionEmbedding.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SinusoidsPositionEmbedding.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SinusoidsPositionEmbedding.length", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SinusoidsPositionEmbedding.channels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SinusoidsPositionEmbedding.max_timescale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 5, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_omni_moe_thinker.Qwen3_VisionMLP", "methods": [ { "kind": "function", "name": "Qwen3_VisionMLP.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Qwen3_VisionMLP.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3_VisionMLP.linear_fc1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionMLP.linear_fc2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_omni_moe_thinker.Qwen3OmniMoeAudioEncoder", "methods": [ { "kind": "function", "name": "Qwen3OmniMoeAudioEncoder.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3OmniMoeAudioEncoder.compute_attn_mask_seqlen", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3OmniMoeAudioEncoder.forward", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Qwen3OmniMoeAudioEncoder._get_cnn_output_lengths", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3OmniMoeAudioEncoder.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "Qwen3OmniMoeAudioEncoder.dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Qwen3OmniMoeAudioEncoder.device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "Qwen3OmniMoeAudioEncoder.num_mel_bins", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeAudioEncoder.max_source_positions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeAudioEncoder.n_window", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeAudioEncoder.n_window_infer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeAudioEncoder.conv_chunksize", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeAudioEncoder.positional_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeAudioEncoder.conv2d1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeAudioEncoder.conv2d2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeAudioEncoder.conv2d3", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeAudioEncoder.conv_out", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeAudioEncoder.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeAudioEncoder.ln_post", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeAudioEncoder.proj1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeAudioEncoder.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeAudioEncoder.proj2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeAudioEncoder.attn_backend", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 31, "n_typed": 13, "n_any": 0, "n_untyped": 18, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 8, "n_attrs": 16, "n_properties": 2 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_omni_moe_thinker.Qwen3_VisionPatchEmbed", "methods": [ { "kind": "function", "name": "Qwen3_VisionPatchEmbed.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Qwen3_VisionPatchEmbed.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3_VisionPatchEmbed.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionPatchEmbed.temporal_patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionPatchEmbed.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionPatchEmbed.proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 7, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 4, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.qwen3_omni_moe_thinker.ISO639_1_SUPPORTED_LANGS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_omni_moe_thinker.Qwen3OmniMoeAudioEncoderLayer", "methods": [ { "kind": "function", "name": "Qwen3OmniMoeAudioEncoderLayer.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3OmniMoeAudioEncoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3OmniMoeAudioEncoderLayer.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeAudioEncoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeAudioEncoderLayer.self_attn_layer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeAudioEncoderLayer.activation_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeAudioEncoderLayer.fc1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeAudioEncoderLayer.fc2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeAudioEncoderLayer.final_layer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 6, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_omni_moe_thinker.Qwen3MoeLLMForCausalLM", "methods": [ { "kind": "function", "name": "Qwen3MoeLLMForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3MoeLLMForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeLLMForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeLLMForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeLLMForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeLLMForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeLLMForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 2, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_omni_moe_thinker.Qwen3OmniMoeAudioAttention", "methods": [ { "kind": "function", "name": "Qwen3OmniMoeAudioAttention.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3OmniMoeAudioAttention.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3OmniMoeAudioAttention.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeAudioAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeAudioAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeAudioAttention.num_local_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeAudioAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeAudioAttention.qkv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeAudioAttention.out_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeAudioAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 6, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_omni_moe_thinker.Qwen3OmniMoeThinkerForConditionalGeneration", "methods": [ { "kind": "function", "name": "Qwen3OmniMoeThinkerForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3OmniMoeThinkerForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3OmniMoeThinkerForConditionalGeneration._get_deepstack_input_embeds", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3OmniMoeThinkerForConditionalGeneration._set_deepstack_input_embeds", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3OmniMoeThinkerForConditionalGeneration._clear_deepstack_input_embeds", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3OmniMoeThinkerForConditionalGeneration._parse_and_validate_multimodal_inputs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3OmniMoeThinkerForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3OmniMoeThinkerForConditionalGeneration.embed_input_ids", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Qwen3OmniMoeThinkerForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Qwen3OmniMoeThinkerForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3OmniMoeThinkerForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3OmniMoeThinkerForConditionalGeneration._compute_audio_token_count", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3OmniMoeThinkerForConditionalGeneration._get_audio_for_video_mapping", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3OmniMoeThinkerForConditionalGeneration.iter_mm_features", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3OmniMoeThinkerForConditionalGeneration._compute_interleaved_positions", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3OmniMoeThinkerForConditionalGeneration.get_speech_to_text_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3OmniMoeThinkerForConditionalGeneration.get_generation_prompt", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "Qwen3OmniMoeThinkerForConditionalGeneration.get_mrope_input_positions", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3OmniMoeThinkerForConditionalGeneration.get_mm_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3OmniMoeThinkerForConditionalGeneration.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeThinkerForConditionalGeneration.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3OmniMoeThinkerForConditionalGeneration.supported_languages", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3OmniMoeThinkerForConditionalGeneration.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeThinkerForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeThinkerForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeThinkerForConditionalGeneration.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeThinkerForConditionalGeneration.use_deepstack", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeThinkerForConditionalGeneration.deepstack_num_level", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeThinkerForConditionalGeneration.visual_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeThinkerForConditionalGeneration.multiscale_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeThinkerForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeThinkerForConditionalGeneration.audio_tower", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeThinkerForConditionalGeneration.visual", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeThinkerForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3OmniMoeThinkerForConditionalGeneration.deepstack_input_embeds", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 69, "n_typed": 54, "n_any": 0, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 19, "n_method_overloads": 19, "n_method_params": 36, "n_attrs": 16, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_omni_moe_thinker.Qwen3_VisionBlock", "methods": [ { "kind": "function", "name": "Qwen3_VisionBlock.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "Qwen3_VisionBlock.forward", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3_VisionBlock.norm1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionBlock.norm2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionBlock.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionBlock.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 15, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 13, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_omni_moe_thinker.Qwen3OmniMoeConditionalGenerationMixin", "methods": [ { "kind": "function", "name": "Qwen3OmniMoeConditionalGenerationMixin._process_audio_input", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_omni_moe_thinker.Qwen3Omni_VisionTransformer", "methods": [ { "kind": "function", "name": "Qwen3Omni_VisionTransformer.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Qwen3Omni_VisionTransformer.rot_pos_emb", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3Omni_VisionTransformer.fast_pos_embed_interpolate", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3Omni_VisionTransformer.compute_attn_mask_seqlen", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3Omni_VisionTransformer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3Omni_VisionTransformer.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "Qwen3Omni_VisionTransformer.dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Qwen3Omni_VisionTransformer.device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "Qwen3Omni_VisionTransformer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3Omni_VisionTransformer.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3Omni_VisionTransformer.image_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3Omni_VisionTransformer.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3Omni_VisionTransformer.spatial_merge_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3Omni_VisionTransformer.spatial_merge_unit", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3Omni_VisionTransformer.temporal_patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3Omni_VisionTransformer.num_grid_per_side", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3Omni_VisionTransformer.apply_vit_abs_pos_embed", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3Omni_VisionTransformer.deepstack_visual_indexes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3Omni_VisionTransformer.patch_embed", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3Omni_VisionTransformer.rotary_pos_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3Omni_VisionTransformer.blocks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3Omni_VisionTransformer.merger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3Omni_VisionTransformer.attn_backend", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3Omni_VisionTransformer.pos_embed", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3Omni_VisionTransformer.merger_list", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 35, "n_typed": 15, "n_any": 0, "n_untyped": 20, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 10, "n_attrs": 17, "n_properties": 2 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_omni_moe_thinker.Qwen3OmniMoeThinkerMultiModalProcessor", "methods": [ { "kind": "function", "name": "Qwen3OmniMoeThinkerMultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Qwen3OmniMoeThinkerMultiModalProcessor._maybe_apply_prompt_updates", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Qwen3OmniMoeThinkerMultiModalProcessor.get_updates_use_audio_in_video", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Qwen3OmniMoeThinkerMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Qwen3OmniMoeThinkerMultiModalProcessor._derive_audio_from_video_placeholders", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3OmniMoeThinkerMultiModalProcessor._get_raw_input_ids", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 26, "n_typed": 26, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 20, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_omni_moe_thinker.Qwen3_VisionPatchMerger", "methods": [ { "kind": "function", "name": "Qwen3_VisionPatchMerger.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "Qwen3_VisionPatchMerger.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3_VisionPatchMerger.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionPatchMerger.use_postshuffle_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionPatchMerger.ln_q", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionPatchMerger.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 10, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 4, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.qwen3_omni_moe_thinker", "names": [ "vllm.model_executor.models.qwen3_omni_moe_thinker.ISO639_1_SUPPORTED_LANGS", "vllm.model_executor.models.qwen3_omni_moe_thinker.Qwen3MoeLLMForCausalLM", "vllm.model_executor.models.qwen3_omni_moe_thinker.Qwen3MoeLLMModel", "vllm.model_executor.models.qwen3_omni_moe_thinker.Qwen3OmniMoeAudioAttention", "vllm.model_executor.models.qwen3_omni_moe_thinker.Qwen3OmniMoeAudioEncoder", "vllm.model_executor.models.qwen3_omni_moe_thinker.Qwen3OmniMoeAudioEncoderLayer", "vllm.model_executor.models.qwen3_omni_moe_thinker.Qwen3OmniMoeConditionalGenerationMixin", "vllm.model_executor.models.qwen3_omni_moe_thinker.Qwen3OmniMoeThinkerForConditionalGeneration", "vllm.model_executor.models.qwen3_omni_moe_thinker.Qwen3OmniMoeThinkerMultiModalProcessor", "vllm.model_executor.models.qwen3_omni_moe_thinker.Qwen3OmniMoeThinkerProcessingInfo", "vllm.model_executor.models.qwen3_omni_moe_thinker.Qwen3Omni_VisionTransformer", "vllm.model_executor.models.qwen3_omni_moe_thinker.Qwen3_VisionBlock", "vllm.model_executor.models.qwen3_omni_moe_thinker.Qwen3_VisionMLP", "vllm.model_executor.models.qwen3_omni_moe_thinker.Qwen3_VisionPatchEmbed", "vllm.model_executor.models.qwen3_omni_moe_thinker.Qwen3_VisionPatchMerger", "vllm.model_executor.models.qwen3_omni_moe_thinker.SinusoidsPositionEmbedding", "vllm.model_executor.models.qwen3_omni_moe_thinker.logger" ], "n_typable": 288, "n_typed": 185, "n_any": 0, "n_untyped": 103, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 59, "n_method_overloads": 59, "n_method_params": 137, "n_classes": 15, "n_attrs": 91, "n_properties": 4, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/qwen3_vl.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.qwen3_vl.Qwen3_VisionTransformer", "methods": [ { "kind": "function", "name": "Qwen3_VisionTransformer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Qwen3_VisionTransformer.rot_pos_ids", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Qwen3_VisionTransformer.rot_pos_emb", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3_VisionTransformer.fast_pos_embed_interpolate", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3_VisionTransformer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3_VisionTransformer.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "Qwen3_VisionTransformer.dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Qwen3_VisionTransformer.device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "Qwen3_VisionTransformer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionTransformer.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionTransformer.num_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionTransformer.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionTransformer.spatial_merge_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionTransformer.spatial_merge_unit", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionTransformer.temporal_patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionTransformer.deepstack_visual_indexes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionTransformer.num_grid_per_side", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionTransformer.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionTransformer.out_hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionTransformer.patch_embed", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionTransformer.pos_embed", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionTransformer.rotary_pos_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionTransformer.merger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionTransformer.deepstack_merger_list", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionTransformer.attn_backend", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionTransformer.blocks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 38, "n_typed": 19, "n_any": 0, "n_untyped": 19, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 12, "n_attrs": 18, "n_properties": 2 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_vl.Qwen3LLMModel", "methods": [ { "kind": "function", "name": "Qwen3LLMModel.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_vl.Qwen3VLMultiModalProcessor", "methods": [ { "kind": "function", "name": "Qwen3VLMultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Qwen3VLMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3VLMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Qwen3VLMultiModalProcessor.get_video_repl", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [], "n_typable": 20, "n_typed": 20, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 16, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_vl.Qwen3_VisionMLP", "methods": [ { "kind": "function", "name": "Qwen3_VisionMLP.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Qwen3_VisionMLP.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3_VisionMLP.linear_fc1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionMLP.linear_fc2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_vl.Qwen3VLProcessingInfo", "methods": [ { "kind": "function", "name": "Qwen3VLProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Qwen3VLProcessingInfo.get_hf_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3VLProcessingInfo.get_image_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3VLProcessingInfo.get_video_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3VLProcessingInfo.get_data_parser", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Qwen3VLProcessingInfo._get_vision_info", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Qwen3VLProcessingInfo._get_max_video_frames", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3VLProcessingInfo.get_num_frames_with_most_features", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3VLProcessingInfo.get_max_video_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3VLProcessingInfo._calculate_timestamps", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Qwen3VLProcessingInfo._get_video_second_idx", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 32, "n_typed": 29, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 21, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_vl.Qwen3_VisionPatchEmbed", "methods": [ { "kind": "function", "name": "Qwen3_VisionPatchEmbed.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Qwen3_VisionPatchEmbed.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3_VisionPatchEmbed.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionPatchEmbed.temporal_patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionPatchEmbed.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionPatchEmbed.proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 7, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 4, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.qwen3_vl.DUMMY_VIDEO_NUM_FRAMES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_vl.Qwen3LLMForCausalLM", "methods": [ { "kind": "function", "name": "Qwen3LLMForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3LLMForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3LLMForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3LLMForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3LLMForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3LLMForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3LLMForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 2, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_vl.Qwen3VLForConditionalGeneration", "methods": [ { "kind": "function", "name": "Qwen3VLForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3VLForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3VLForConditionalGeneration.set_aux_hidden_state_layers", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3VLForConditionalGeneration.get_eagle3_aux_hidden_state_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Qwen3VLForConditionalGeneration._get_deepstack_input_embeds", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3VLForConditionalGeneration._set_deepstack_input_embeds", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3VLForConditionalGeneration._clear_deepstack_input_embeds", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3VLForConditionalGeneration._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3VLForConditionalGeneration._parse_and_validate_video_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3VLForConditionalGeneration._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3VLForConditionalGeneration._process_video_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3VLForConditionalGeneration._postprocess_image_embeds_evs", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3VLForConditionalGeneration._postprocess_video_embeds_evs", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3VLForConditionalGeneration._create_final_video_embeddings", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Qwen3VLForConditionalGeneration._get_expanded_positions", "n_typed": 0, "n_any": 0, "n_untyped": 9, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "Qwen3VLForConditionalGeneration._parse_and_validate_multimodal_inputs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3VLForConditionalGeneration._iter_mm_grid_hw", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Qwen3VLForConditionalGeneration._get_evs_mask_segments", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3VLForConditionalGeneration._extract_frame_offsets_from_mask", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3VLForConditionalGeneration._get_actual_frame_token_counts", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3VLForConditionalGeneration.get_mrope_input_positions", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3VLForConditionalGeneration._get_mrope_input_positions", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Qwen3VLForConditionalGeneration.recompute_mrope_positions", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Qwen3VLForConditionalGeneration._recompute_mrope_positions", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "Qwen3VLForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3VLForConditionalGeneration._compute_deepstack_embeds", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Qwen3VLForConditionalGeneration.embed_input_ids", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Qwen3VLForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Qwen3VLForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3VLForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3VLForConditionalGeneration.get_mm_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Qwen3VLForConditionalGeneration.get_num_mm_encoder_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3VLForConditionalGeneration.get_num_mm_connector_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3VLForConditionalGeneration.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3VLForConditionalGeneration.supports_encoder_tp_data", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3VLForConditionalGeneration.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3VLForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3VLForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3VLForConditionalGeneration.use_data_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3VLForConditionalGeneration.video_pruning_rate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3VLForConditionalGeneration.is_multimodal_pruning_enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3VLForConditionalGeneration.use_deepstack", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3VLForConditionalGeneration.deepstack_num_level", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3VLForConditionalGeneration.visual_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3VLForConditionalGeneration.multiscale_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3VLForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3VLForConditionalGeneration.visual", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3VLForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3VLForConditionalGeneration.deepstack_input_embeds", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 122, "n_typed": 97, "n_any": 0, "n_untyped": 25, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 33, "n_method_overloads": 33, "n_method_params": 75, "n_attrs": 16, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_vl.Qwen3_VisionPatchMerger", "methods": [ { "kind": "function", "name": "Qwen3_VisionPatchMerger.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "Qwen3_VisionPatchMerger.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3_VisionPatchMerger.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionPatchMerger.use_postshuffle_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionPatchMerger.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionPatchMerger.linear_fc1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionPatchMerger.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionPatchMerger.linear_fc2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 10, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_vl.Qwen3_VisionBlock", "methods": [ { "kind": "function", "name": "Qwen3_VisionBlock.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "Qwen3_VisionBlock.forward", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3_VisionBlock.norm1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionBlock.norm2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionBlock.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_VisionBlock.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 15, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 13, "n_attrs": 4, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.qwen3_vl.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_vl.Qwen3VLDummyInputsBuilder", "methods": [ { "kind": "function", "name": "Qwen3VLDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3VLDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Qwen3VLDummyInputsBuilder._get_dummy_videos", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [], "n_typable": 11, "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 8, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.qwen3_vl", "names": [ "vllm.model_executor.models.qwen3_vl.DUMMY_VIDEO_NUM_FRAMES", "vllm.model_executor.models.qwen3_vl.Qwen3LLMForCausalLM", "vllm.model_executor.models.qwen3_vl.Qwen3LLMModel", "vllm.model_executor.models.qwen3_vl.Qwen3VLDummyInputsBuilder", "vllm.model_executor.models.qwen3_vl.Qwen3VLForConditionalGeneration", "vllm.model_executor.models.qwen3_vl.Qwen3VLMultiModalProcessor", "vllm.model_executor.models.qwen3_vl.Qwen3VLProcessingInfo", "vllm.model_executor.models.qwen3_vl.Qwen3_VisionBlock", "vllm.model_executor.models.qwen3_vl.Qwen3_VisionMLP", "vllm.model_executor.models.qwen3_vl.Qwen3_VisionPatchEmbed", "vllm.model_executor.models.qwen3_vl.Qwen3_VisionPatchMerger", "vllm.model_executor.models.qwen3_vl.Qwen3_VisionTransformer", "vllm.model_executor.models.qwen3_vl.logger" ], "n_typable": 297, "n_typed": 223, "n_any": 0, "n_untyped": 74, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 67, "n_method_overloads": 67, "n_method_params": 172, "n_classes": 11, "n_attrs": 59, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/qwen3_vl_moe.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.qwen3_vl_moe.Qwen3VLMoeProcessingInfo", "methods": [ { "kind": "function", "name": "Qwen3VLMoeProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_vl_moe.Qwen3MoeLLMModel", "methods": [ { "kind": "function", "name": "Qwen3MoeLLMModel.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Qwen3MoeLLMModel.load_fused_expert_weights", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Qwen3MoeLLMModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 14, "n_typed": 14, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 11, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_vl_moe.Qwen3VLMoeForConditionalGeneration", "methods": [ { "kind": "function", "name": "Qwen3VLMoeForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3VLMoeForConditionalGeneration.is_3d_moe_weight", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3VLMoeForConditionalGeneration.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3VLMoeForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3VLMoeForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3VLMoeForConditionalGeneration.use_data_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3VLMoeForConditionalGeneration.video_pruning_rate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3VLMoeForConditionalGeneration.is_multimodal_pruning_enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3VLMoeForConditionalGeneration.use_deepstack", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3VLMoeForConditionalGeneration.deepstack_num_level", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3VLMoeForConditionalGeneration.visual_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3VLMoeForConditionalGeneration.multiscale_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3VLMoeForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3VLMoeForConditionalGeneration.visual", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3VLMoeForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3VLMoeForConditionalGeneration.deepstack_input_embeds", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 3, "n_any": 0, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 15, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_vl_moe.Qwen3VLMoeMixtureOfExperts", "methods": [ { "kind": "function", "name": "Qwen3VLMoeMixtureOfExperts.update_physical_experts_metadata", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3VLMoeMixtureOfExperts.set_moe_parameters", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen3_vl_moe.Qwen3MoeLLMForCausalLM", "methods": [ { "kind": "function", "name": "Qwen3MoeLLMForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3MoeLLMForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeLLMForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeLLMForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeLLMForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeLLMForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3MoeLLMForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 2, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 6, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.qwen3_vl_moe.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.models.qwen3_vl_moe", "names": [ "vllm.model_executor.models.qwen3_vl_moe.Qwen3MoeLLMForCausalLM", "vllm.model_executor.models.qwen3_vl_moe.Qwen3MoeLLMModel", "vllm.model_executor.models.qwen3_vl_moe.Qwen3VLMoeForConditionalGeneration", "vllm.model_executor.models.qwen3_vl_moe.Qwen3VLMoeMixtureOfExperts", "vllm.model_executor.models.qwen3_vl_moe.Qwen3VLMoeProcessingInfo", "vllm.model_executor.models.qwen3_vl_moe.logger" ], "n_typable": 47, "n_typed": 22, "n_any": 0, "n_untyped": 25, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 17, "n_classes": 5, "n_attrs": 22, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/qwen_vl.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.qwen_vl.QwenVLDummyInputsBuilder", "methods": [ { "kind": "function", "name": "QwenVLDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "QwenVLDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen_vl.QwenImageEmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "QwenImageEmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "QwenImageEmbeddingInputs.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen_vl.TransformerBlock", "methods": [ { "kind": "function", "name": "TransformerBlock.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "TransformerBlock.get_cast_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TransformerBlock.get_cast_device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TransformerBlock.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TransformerBlock.width", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TransformerBlock.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TransformerBlock.resblocks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 12, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 9, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen_vl.QwenImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "QwenImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "QwenImagePixelInputs.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen_vl.QwenVLMultiModalProcessor", "methods": [ { "kind": "function", "name": "QwenVLMultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "QwenVLMultiModalProcessor._hf_processor_applies_updates", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "QwenVLMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "QwenVLMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 17, "n_typed": 17, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 13, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen_vl.QwenVLMLP", "methods": [ { "kind": "function", "name": "QwenVLMLP.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "QwenVLMLP.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "QwenVLMLP.c_fc", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QwenVLMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QwenVLMLP.c_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 4, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen_vl.VisionTransformer", "methods": [ { "kind": "function", "name": "VisionTransformer.__init__", "n_typed": 11, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 }, { "kind": "function", "name": "VisionTransformer.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "VisionTransformer.image_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VisionTransformer.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VisionTransformer.grid_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VisionTransformer.output_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VisionTransformer.conv1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VisionTransformer.positional_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VisionTransformer.ln_pre", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VisionTransformer.transformer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VisionTransformer.attn_pool", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VisionTransformer.ln_post", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VisionTransformer.proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VisionTransformer.image_start_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VisionTransformer.image_end_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VisionTransformer.image_pad_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 29, "n_typed": 13, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 13, "n_attrs": 14, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.qwen_vl.QwenImageInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.qwen_vl.VisualAttentionBlock", "methods": [ { "kind": "function", "name": "VisualAttentionBlock.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "VisualAttentionBlock.attention", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VisualAttentionBlock.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "VisualAttentionBlock.ln_1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VisualAttentionBlock.ln_2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VisualAttentionBlock.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VisualAttentionBlock.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 12, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 10, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen_vl.QwenVLProcessor", "methods": [ { "kind": "function", "name": "QwenVLProcessor.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "QwenVLProcessor.__call__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [ { "kind": "property", "name": "QwenVLProcessor.image_start_tag", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "QwenVLProcessor.image_end_tag", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "QwenVLProcessor.image_pad_tag", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "QwenVLProcessor.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QwenVLProcessor.tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "QwenVLProcessor.image_transform", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 10, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 3, "n_properties": 3 }, { "kind": "class", "name": "vllm.model_executor.models.qwen_vl.QwenVLProcessingInfo", "methods": [ { "kind": "function", "name": "QwenVLProcessingInfo.get_hf_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "QwenVLProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "QwenVLProcessingInfo.get_num_image_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen_vl.QwenVLForConditionalGeneration", "methods": [ { "kind": "function", "name": "QwenVLForConditionalGeneration.get_mm_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "QwenVLForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "QwenVLForConditionalGeneration.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "QwenVLForConditionalGeneration._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "QwenVLForConditionalGeneration._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "QwenVLForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "QwenVLForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "QwenVLForConditionalGeneration.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "QwenVLForConditionalGeneration.embed_input_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "QwenVLForConditionalGeneration.transformer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 21, "n_typed": 21, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 13, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen_vl.VisualAttention", "methods": [ { "kind": "function", "name": "VisualAttention.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "VisualAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "VisualAttention.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VisualAttention.kdim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VisualAttention.vdim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VisualAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VisualAttention.hidden_size_per_attention_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VisualAttention.num_attention_heads_per_partition", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VisualAttention.hidden_size_per_partition", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VisualAttention.in_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VisualAttention.out_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VisualAttention.norm_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 9, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 10, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.qwen_vl.QwenVLModel", "methods": [ { "kind": "function", "name": "QwenVLModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "QwenVLModel.visual", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 4, "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.qwen_vl", "names": [ "vllm.model_executor.models.qwen_vl.QwenImageEmbeddingInputs", "vllm.model_executor.models.qwen_vl.QwenImageInputs", "vllm.model_executor.models.qwen_vl.QwenImagePixelInputs", "vllm.model_executor.models.qwen_vl.QwenVLDummyInputsBuilder", "vllm.model_executor.models.qwen_vl.QwenVLForConditionalGeneration", "vllm.model_executor.models.qwen_vl.QwenVLMLP", "vllm.model_executor.models.qwen_vl.QwenVLModel", "vllm.model_executor.models.qwen_vl.QwenVLMultiModalProcessor", "vllm.model_executor.models.qwen_vl.QwenVLProcessingInfo", "vllm.model_executor.models.qwen_vl.QwenVLProcessor", "vllm.model_executor.models.qwen_vl.TransformerBlock", "vllm.model_executor.models.qwen_vl.VisionTransformer", "vllm.model_executor.models.qwen_vl.VisualAttention", "vllm.model_executor.models.qwen_vl.VisualAttentionBlock" ], "n_typable": 162, "n_typed": 115, "n_any": 0, "n_untyped": 47, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 32, "n_method_overloads": 32, "n_method_params": 83, "n_classes": 13, "n_attrs": 46, "n_properties": 3, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/radio.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.radio.ViTPatchLinear", "methods": [ { "kind": "function", "name": "ViTPatchLinear.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ViTPatchLinear.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 6, "n_typed": 3, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 4, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.radio.calc_seq_len", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.model_executor.models.radio.to_4tuple", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.radio.RadioParallelAttention", "methods": [ { "kind": "function", "name": "RadioParallelAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.radio.input_dim_t", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.radio.RadioVisionEncoder", "methods": [ { "kind": "function", "name": "RadioVisionEncoder.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "RadioVisionEncoder.forward", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 3, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.radio.ClsToken", "methods": [ { "kind": "function", "name": "ClsToken.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "ClsToken.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ClsToken.ndim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ClsToken.enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ClsToken.num_registers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ClsToken.num_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ClsToken.num_patches", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ClsToken.token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 6, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 6, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.radio.to_2tuple", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.radio.RadioInternVisionModel", "methods": [ { "kind": "function", "name": "RadioInternVisionModel.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "RadioInternVisionModel._init_img_size", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "RadioInternVisionModel.get_input_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RadioInternVisionModel.create_inter_image_attention_mask", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "RadioInternVisionModel.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RadioInternVisionModel.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RadioInternVisionModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RadioInternVisionModel.patch_generator", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RadioInternVisionModel.encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 13, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 11, "n_attrs": 4, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.radio.to_3tuple", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.radio.Im2Patches", "methods": [ { "kind": "function", "name": "Im2Patches.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Im2Patches.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Im2Patches.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 5, "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.radio.norm_t", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.radio.RadioVisionEncoderLayer", "methods": [ { "kind": "function", "name": "RadioVisionEncoderLayer.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "RadioVisionEncoderLayer.forward", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 3, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.radio.calc_seq_lens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.model_executor.models.radio.to_1tuple", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.radio.ViTPatchGenerator", "methods": [ { "kind": "function", "name": "ViTPatchGenerator.__init__", "n_typed": 13, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 }, { "kind": "function", "name": "ViTPatchGenerator.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ViTPatchGenerator.apply_pos_enc_dynamic", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ViTPatchGenerator.cls_token_dynamic", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ViTPatchGenerator._load_embed", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ViTPatchGenerator._load_projection", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ViTPatchGenerator.embed_patches", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ViTPatchGenerator.apply_pos_enc", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ViTPatchGenerator.get_pos_enc", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ViTPatchGenerator._get_pos_embeddings", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [ { "kind": "property", "name": "ViTPatchGenerator.apply_cls_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "ViTPatchGenerator.num_cls_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "ViTPatchGenerator.num_cls_patches", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "ViTPatchGenerator.num_registers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "ViTPatchGenerator.num_skip", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "ViTPatchGenerator.cpe_mode", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ViTPatchGenerator.pos_dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ViTPatchGenerator.return_pos_enc", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ViTPatchGenerator.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ViTPatchGenerator.abs_pos", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ViTPatchGenerator.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ViTPatchGenerator.num_rows", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ViTPatchGenerator.num_cols", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ViTPatchGenerator.input_dims", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ViTPatchGenerator.num_patches", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ViTPatchGenerator.max_input_dims", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ViTPatchGenerator.im_to_patches", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ViTPatchGenerator.embedder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ViTPatchGenerator.cls_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ViTPatchGenerator.patch_normalizer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ViTPatchGenerator.pos_embed", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 65, "n_typed": 38, "n_any": 0, "n_untyped": 27, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 34, "n_attrs": 16, "n_properties": 5 }, { "kind": "class", "name": "vllm.model_executor.models.radio.RadioModel", "methods": [ { "kind": "function", "name": "RadioModel.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "RadioModel.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "RadioModel.load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RadioModel._extract_final", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RadioModel.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RadioModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RadioModel.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RadioModel.summary_idxs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 14, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 11, "n_attrs": 4, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.radio", "names": [ "vllm.model_executor.models.radio.ClsToken", "vllm.model_executor.models.radio.Im2Patches", "vllm.model_executor.models.radio.RadioInternVisionModel", "vllm.model_executor.models.radio.RadioModel", "vllm.model_executor.models.radio.RadioParallelAttention", "vllm.model_executor.models.radio.RadioVisionEncoder", "vllm.model_executor.models.radio.RadioVisionEncoderLayer", "vllm.model_executor.models.radio.ViTPatchGenerator", "vllm.model_executor.models.radio.ViTPatchLinear", "vllm.model_executor.models.radio.calc_seq_len", "vllm.model_executor.models.radio.calc_seq_lens", "vllm.model_executor.models.radio.input_dim_t", "vllm.model_executor.models.radio.norm_t", "vllm.model_executor.models.radio.to_1tuple", "vllm.model_executor.models.radio.to_2tuple", "vllm.model_executor.models.radio.to_3tuple", "vllm.model_executor.models.radio.to_4tuple" ], "n_typable": 154, "n_typed": 94, "n_any": 0, "n_untyped": 60, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 4, "n_methods": 29, "n_method_overloads": 29, "n_method_params": 78, "n_classes": 9, "n_attrs": 38, "n_properties": 5, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/roberta.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.roberta.RobertaClassificationHead", "methods": [ { "kind": "function", "name": "RobertaClassificationHead.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RobertaClassificationHead.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RobertaClassificationHead.dense", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RobertaClassificationHead.out_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 6, "n_typed": 3, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.roberta.BgeM3EmbeddingModel", "methods": [ { "kind": "function", "name": "BgeM3EmbeddingModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BgeM3EmbeddingModel._build_pooler", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BgeM3EmbeddingModel.load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BgeM3EmbeddingModel.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BgeM3EmbeddingModel.head_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BgeM3EmbeddingModel.bos_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BgeM3EmbeddingModel.eos_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BgeM3EmbeddingModel.secondary_weight_prefixes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BgeM3EmbeddingModel.secondary_weight_files", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BgeM3EmbeddingModel.secondary_weights", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 5, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.roberta.RobertaEmbeddingModel", "methods": [ { "kind": "function", "name": "RobertaEmbeddingModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "RobertaEmbeddingModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "RobertaEmbeddingModel._build_model", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "RobertaEmbeddingModel.load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RobertaEmbeddingModel.padding_idx", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 14, "n_typed": 12, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 9, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.roberta.RobertaForSequenceClassification", "methods": [ { "kind": "function", "name": "RobertaForSequenceClassification.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "RobertaForSequenceClassification.load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RobertaForSequenceClassification.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RobertaForSequenceClassification.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RobertaForSequenceClassification.is_pooling_model", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RobertaForSequenceClassification.jina_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RobertaForSequenceClassification.padding_idx", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "RobertaForSequenceClassification.num_labels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RobertaForSequenceClassification.roberta", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RobertaForSequenceClassification.classifier", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RobertaForSequenceClassification.pooler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 12, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 9, "n_attrs": 7, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.roberta.filter_secondary_weights", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.models.roberta.RobertaEmbedding", "methods": [ { "kind": "function", "name": "RobertaEmbedding.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RobertaEmbedding.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RobertaEmbedding.size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RobertaEmbedding.word_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RobertaEmbedding.padding_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RobertaEmbedding.position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RobertaEmbedding.token_type_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RobertaEmbedding.LayerNorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 5, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 6, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.roberta.replace_roberta_positions", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [], "name": "vllm.model_executor.models.roberta", "names": [ "vllm.model_executor.models.roberta.BgeM3EmbeddingModel", "vllm.model_executor.models.roberta.RobertaClassificationHead", "vllm.model_executor.models.roberta.RobertaEmbedding", "vllm.model_executor.models.roberta.RobertaEmbeddingModel", "vllm.model_executor.models.roberta.RobertaForSequenceClassification", "vllm.model_executor.models.roberta.filter_secondary_weights", "vllm.model_executor.models.roberta.replace_roberta_positions" ], "n_typable": 72, "n_typed": 44, "n_any": 0, "n_untyped": 28, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 5, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 28, "n_classes": 5, "n_attrs": 23, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/rvl.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.rvl.RForConditionalGeneration", "methods": [ { "kind": "function", "name": "RForConditionalGeneration.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RForConditionalGeneration.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RForConditionalGeneration.multi_modal_projector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 5, "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.rvl.RVLDummyInputsBuilder", "methods": [ { "kind": "function", "name": "RVLDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RVLDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.rvl.RVLMultiModalProjector", "methods": [ { "kind": "function", "name": "RVLMultiModalProjector.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RVLMultiModalProjector.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RVLMultiModalProjector.pre_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RVLMultiModalProjector.linear_1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RVLMultiModalProjector.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RVLMultiModalProjector.linear_2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 2, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.rvl.RVLProcessingInfo", "methods": [ { "kind": "function", "name": "RVLProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RVLProcessingInfo.get_hf_processor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.rvl", "names": [ "vllm.model_executor.models.rvl.RForConditionalGeneration", "vllm.model_executor.models.rvl.RVLDummyInputsBuilder", "vllm.model_executor.models.rvl.RVLMultiModalProjector", "vllm.model_executor.models.rvl.RVLProcessingInfo" ], "n_typable": 22, "n_typed": 12, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 9, "n_classes": 4, "n_attrs": 6, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/seed_oss.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.seed_oss.SeedOssDecoderLayer", "methods": [ { "kind": "function", "name": "SeedOssDecoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "SeedOssDecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SeedOssDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 9, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.seed_oss.SeedOssMLP", "methods": [ { "kind": "function", "name": "SeedOssMLP.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "SeedOssMLP.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SeedOssMLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 6, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.seed_oss.SeedOssAttention", "methods": [ { "kind": "function", "name": "SeedOssAttention.__init__", "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "SeedOssAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SeedOssAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 27, "n_typed": 14, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 12, "n_attrs": 13, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.seed_oss.SeedOssForCausalLM", "methods": [ { "kind": "function", "name": "SeedOssForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SeedOssForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SeedOssForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "SeedOssForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SeedOssForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SeedOssForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SeedOssForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 13, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 7, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.seed_oss.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.seed_oss.SeedOssModel", "methods": [ { "kind": "function", "name": "SeedOssModel.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SeedOssModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SeedOssModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "SeedOssModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SeedOssModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssModel.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 12, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 9, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.seed_oss", "names": [ "vllm.model_executor.models.seed_oss.SeedOssAttention", "vllm.model_executor.models.seed_oss.SeedOssDecoderLayer", "vllm.model_executor.models.seed_oss.SeedOssForCausalLM", "vllm.model_executor.models.seed_oss.SeedOssMLP", "vllm.model_executor.models.seed_oss.SeedOssModel", "vllm.model_executor.models.seed_oss.logger" ], "n_typable": 92, "n_typed": 54, "n_any": 0, "n_untyped": 38, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 43, "n_classes": 5, "n_attrs": 35, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/siglip.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.siglip.SiglipProcessingInfo", "methods": [ { "kind": "function", "name": "SiglipProcessingInfo.get_hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SiglipProcessingInfo.get_vision_encoder_info", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SiglipProcessingInfo.get_hf_processor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SiglipProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SiglipProcessingInfo.get_num_image_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SiglipProcessingInfo.get_image_size_with_most_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SiglipProcessingInfo.get_max_image_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 10, "n_typed": 7, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.siglip.SiglipEncoderInfo", "methods": [ { "kind": "function", "name": "SiglipEncoderInfo.get_num_image_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SiglipEncoderInfo.get_image_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SiglipEncoderInfo.get_patch_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SiglipEncoderInfo.get_patch_grid_length", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.siglip.SiglipMultiModalProcessor", "methods": [ { "kind": "function", "name": "SiglipMultiModalProcessor.apply", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SiglipMultiModalProcessor._hf_processor_applies_updates", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "SiglipMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SiglipMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [ { "kind": "property", "name": "SiglipMultiModalProcessor.image_token_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [], "n_typable": 16, "n_typed": 16, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 11, "n_attrs": 0, "n_properties": 1 }, { "kind": "class", "name": "vllm.model_executor.models.siglip.SiglipAttention", "methods": [ { "kind": "function", "name": "SiglipAttention.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "SiglipAttention.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SiglipAttention.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipAttention.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipAttention.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipAttention.out_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipAttention.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipAttention.num_heads_per_partition", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 7, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 10, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.siglip.SiglipEmbeddingModel", "methods": [ { "kind": "function", "name": "SiglipEmbeddingModel.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SiglipEmbeddingModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SiglipEmbeddingModel.get_text_features", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SiglipEmbeddingModel._flip_sequences_by_position_ids", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SiglipEmbeddingModel.get_image_features", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SiglipEmbeddingModel._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SiglipEmbeddingModel._process_image_inputs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SiglipEmbeddingModel._embed_text_input_ids", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "SiglipEmbeddingModel.embed_input_ids", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "SiglipEmbeddingModel.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SiglipEmbeddingModel.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "SiglipEmbeddingModel.load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SiglipEmbeddingModel.is_pooling_model", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SiglipEmbeddingModel.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SiglipEmbeddingModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipEmbeddingModel.text_embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipEmbeddingModel.vision_embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipEmbeddingModel.text_projection_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipEmbeddingModel.pooler_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipEmbeddingModel.pooler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipEmbeddingModel.text_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipEmbeddingModel.vision_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 48, "n_typed": 38, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 28, "n_attrs": 10, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.siglip.SiglipImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "SiglipImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SiglipImagePixelInputs.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.siglip.maybe_swap_ffn_param", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "class", "name": "vllm.model_executor.models.siglip.SiglipVisionEmbeddings", "methods": [ { "kind": "function", "name": "SiglipVisionEmbeddings.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SiglipVisionEmbeddings.interpolate_pos_encoding", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SiglipVisionEmbeddings.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SiglipVisionEmbeddings.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipVisionEmbeddings.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipVisionEmbeddings.image_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipVisionEmbeddings.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipVisionEmbeddings.patch_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipVisionEmbeddings.num_patches", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipVisionEmbeddings.num_positions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipVisionEmbeddings.position_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 8, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.siglip.SiglipEncoder", "methods": [ { "kind": "function", "name": "SiglipEncoder.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "SiglipEncoder.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SiglipEncoder.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipEncoder.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 9, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.siglip.SiglipTextTransformer", "methods": [ { "kind": "function", "name": "SiglipTextTransformer.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SiglipTextTransformer.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SiglipTextTransformer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SiglipTextTransformer.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SiglipTextTransformer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipTextTransformer.embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipTextTransformer.encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipTextTransformer.final_layer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipTextTransformer.head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 12, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.siglip.SiglipVisionModel", "methods": [ { "kind": "function", "name": "SiglipVisionModel.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "SiglipVisionModel.get_input_embeddings", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SiglipVisionModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "SiglipVisionModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "SiglipVisionModel.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "SiglipVisionModel.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "SiglipVisionModel.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipVisionModel.vision_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 15, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 11, "n_attrs": 2, "n_properties": 2 }, { "kind": "class", "name": "vllm.model_executor.models.siglip.SiglipDummyInputsBuilder", "methods": [ { "kind": "function", "name": "SiglipDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SiglipDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.siglip.SiglipEncoderLayer", "methods": [ { "kind": "function", "name": "SiglipEncoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "SiglipEncoderLayer.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SiglipEncoderLayer.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipEncoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipEncoderLayer.layer_norm1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipEncoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipEncoderLayer.layer_norm2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.siglip.SiglipVisionTransformer", "methods": [ { "kind": "function", "name": "SiglipVisionTransformer.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "SiglipVisionTransformer.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "SiglipVisionTransformer.maybe_layer_norm_and_apply_head", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SiglipVisionTransformer.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "SiglipVisionTransformer.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "SiglipVisionTransformer.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "SiglipVisionTransformer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipVisionTransformer.embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipVisionTransformer.encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipVisionTransformer.head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipVisionTransformer.last_hs_proc", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipVisionTransformer.post_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipVisionTransformer.use_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 25, "n_typed": 16, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 12, "n_attrs": 7, "n_properties": 2 }, { "kind": "class", "name": "vllm.model_executor.models.siglip.SiglipMLP", "methods": [ { "kind": "function", "name": "SiglipMLP.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SiglipMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SiglipMLP.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipMLP.activation_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipMLP.fc1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipMLP.fc2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 6, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.siglip.SiglipTextEmbeddings", "methods": [ { "kind": "function", "name": "SiglipTextEmbeddings.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SiglipTextEmbeddings.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SiglipTextEmbeddings.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipTextEmbeddings.token_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipTextEmbeddings.position_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 5, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.siglip.SiglipMultiheadAttentionPoolingHead", "methods": [ { "kind": "function", "name": "SiglipMultiheadAttentionPoolingHead.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SiglipMultiheadAttentionPoolingHead.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SiglipMultiheadAttentionPoolingHead.probe", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipMultiheadAttentionPoolingHead.attention", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipMultiheadAttentionPoolingHead.layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SiglipMultiheadAttentionPoolingHead.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 6, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 4, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.siglip", "names": [ "vllm.model_executor.models.siglip.SiglipAttention", "vllm.model_executor.models.siglip.SiglipDummyInputsBuilder", "vllm.model_executor.models.siglip.SiglipEmbeddingModel", "vllm.model_executor.models.siglip.SiglipEncoder", "vllm.model_executor.models.siglip.SiglipEncoderInfo", "vllm.model_executor.models.siglip.SiglipEncoderLayer", "vllm.model_executor.models.siglip.SiglipImagePixelInputs", "vllm.model_executor.models.siglip.SiglipMLP", "vllm.model_executor.models.siglip.SiglipMultiModalProcessor", "vllm.model_executor.models.siglip.SiglipMultiheadAttentionPoolingHead", "vllm.model_executor.models.siglip.SiglipProcessingInfo", "vllm.model_executor.models.siglip.SiglipTextEmbeddings", "vllm.model_executor.models.siglip.SiglipTextTransformer", "vllm.model_executor.models.siglip.SiglipVisionEmbeddings", "vllm.model_executor.models.siglip.SiglipVisionModel", "vllm.model_executor.models.siglip.SiglipVisionTransformer", "vllm.model_executor.models.siglip.maybe_swap_ffn_param" ], "n_typable": 241, "n_typed": 172, "n_any": 0, "n_untyped": 69, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 5, "n_methods": 56, "n_method_overloads": 56, "n_method_params": 114, "n_classes": 16, "n_attrs": 62, "n_properties": 5, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/siglip2navit.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.siglip2navit.VisionRotaryEmbedding", "methods": [ { "kind": "function", "name": "VisionRotaryEmbedding.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VisionRotaryEmbedding.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.siglip2navit.Siglip2VisionEmbeddings", "methods": [ { "kind": "function", "name": "Siglip2VisionEmbeddings.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Siglip2VisionEmbeddings.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Siglip2VisionEmbeddings.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2VisionEmbeddings.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2VisionEmbeddings.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2VisionEmbeddings.image_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2VisionEmbeddings.num_patches", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2VisionEmbeddings.preserve_original_pe", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2VisionEmbeddings.hidden_stride", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2VisionEmbeddings.patch_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2VisionEmbeddings.position_embedding_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2VisionEmbeddings.position_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 4, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 10, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.siglip2navit.Siglip2Encoder", "methods": [ { "kind": "function", "name": "Siglip2Encoder.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Siglip2Encoder.rot_pos_emb", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Siglip2Encoder.get_window_index", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Siglip2Encoder.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Siglip2Encoder.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2Encoder.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2Encoder.rotary_pos_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2Encoder.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2Encoder.hidden_stride", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2Encoder.window_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2Encoder.spatial_merge_unit", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2Encoder.fullatt_block_indexes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 6, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 7, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.siglip2navit.Siglip2MLP", "methods": [ { "kind": "function", "name": "Siglip2MLP.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Siglip2MLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Siglip2MLP.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2MLP.activation_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2MLP.fc1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2MLP.fc2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 5, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 4, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.siglip2navit.apply_rotary_pos_emb", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "class", "name": "vllm.model_executor.models.siglip2navit.Siglip2Attention", "methods": [ { "kind": "function", "name": "Siglip2Attention.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Siglip2Attention.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Siglip2Attention.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2Attention.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2Attention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2Attention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2Attention.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2Attention.dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2Attention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2Attention.out_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2Attention.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2Attention.num_heads_per_partition", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2Attention.use_rope", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2Attention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2Attention.apply_rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 7, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 13, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.siglip2navit.Siglip2EncoderLayer", "methods": [ { "kind": "function", "name": "Siglip2EncoderLayer.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Siglip2EncoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Siglip2EncoderLayer.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2EncoderLayer.layer_norm1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2EncoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2EncoderLayer.layer_norm2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2EncoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 7, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.siglip2navit.Siglip2NavitModel", "methods": [ { "kind": "function", "name": "Siglip2NavitModel.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Siglip2NavitModel.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Siglip2NavitModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Siglip2NavitModel.vision_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 8, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.siglip2navit.Siglip2VisionTransformer", "methods": [ { "kind": "function", "name": "Siglip2VisionTransformer.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Siglip2VisionTransformer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Siglip2VisionTransformer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2VisionTransformer.embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2VisionTransformer.encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Siglip2VisionTransformer.post_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 6, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 4, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.siglip2navit", "names": [ "vllm.model_executor.models.siglip2navit.Siglip2Attention", "vllm.model_executor.models.siglip2navit.Siglip2Encoder", "vllm.model_executor.models.siglip2navit.Siglip2EncoderLayer", "vllm.model_executor.models.siglip2navit.Siglip2MLP", "vllm.model_executor.models.siglip2navit.Siglip2NavitModel", "vllm.model_executor.models.siglip2navit.Siglip2VisionEmbeddings", "vllm.model_executor.models.siglip2navit.Siglip2VisionTransformer", "vllm.model_executor.models.siglip2navit.VisionRotaryEmbedding", "vllm.model_executor.models.siglip2navit.apply_rotary_pos_emb" ], "n_typable": 111, "n_typed": 55, "n_any": 0, "n_untyped": 56, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 6, "n_methods": 19, "n_method_overloads": 19, "n_method_params": 40, "n_classes": 8, "n_attrs": 45, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/skyworkr1v.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.skyworkr1v.SkyworkR1VImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "SkyworkR1VImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SkyworkR1VImagePixelInputs.pixel_values_flat", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SkyworkR1VImagePixelInputs.num_patches", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.skyworkr1v.SkyworkR1VImageEmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "SkyworkR1VImageEmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SkyworkR1VImageEmbeddingInputs.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.skyworkr1v.build_transform", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.model_executor.models.skyworkr1v.IMG_END", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.skyworkr1v.IMG_CONTEXT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.model_executor.models.skyworkr1v.calculate_skyworkr1v_targets", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "class", "name": "vllm.model_executor.models.skyworkr1v.SkyworkR1VChatModel", "methods": [ { "kind": "function", "name": "SkyworkR1VChatModel.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SkyworkR1VChatModel.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SkyworkR1VChatModel._patch_quant_config", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SkyworkR1VChatModel._init_vision_model", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "SkyworkR1VChatModel._init_mlp1", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SkyworkR1VChatModel.pixel_shuffle", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SkyworkR1VChatModel.extract_feature", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SkyworkR1VChatModel._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SkyworkR1VChatModel._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SkyworkR1VChatModel._set_visual_token_mask", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SkyworkR1VChatModel.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SkyworkR1VChatModel.embed_input_ids", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "SkyworkR1VChatModel.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "SkyworkR1VChatModel.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SkyworkR1VChatModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SkyworkR1VChatModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SkyworkR1VChatModel.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SkyworkR1VChatModel.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SkyworkR1VChatModel.num_image_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SkyworkR1VChatModel.downsample_ratio", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SkyworkR1VChatModel.ps_version", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SkyworkR1VChatModel.is_mono", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SkyworkR1VChatModel.img_context_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SkyworkR1VChatModel.visual_token_mask", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SkyworkR1VChatModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SkyworkR1VChatModel.vision_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SkyworkR1VChatModel.mlp1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SkyworkR1VChatModel.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 59, "n_typed": 41, "n_any": 0, "n_untyped": 18, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 31, "n_attrs": 13, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.skyworkr1v.SkyworkR1VProcessingInfo", "methods": [ { "kind": "function", "name": "SkyworkR1VProcessingInfo.get_hf_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SkyworkR1VProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SkyworkR1VProcessingInfo.get_num_image_tokens", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SkyworkR1VProcessingInfo.get_image_size_with_most_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 8, "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.skyworkr1v.SkyworkR1VMultiModalProcessor", "methods": [ { "kind": "function", "name": "SkyworkR1VMultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "SkyworkR1VMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SkyworkR1VMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.skyworkr1v.SkyworkR1VProcessor", "methods": [ { "kind": "function", "name": "SkyworkR1VProcessor.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "SkyworkR1VProcessor.get_image_repl", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SkyworkR1VProcessor.resolve_min_max_num", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "SkyworkR1VProcessor.resolve_target_ratios", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "SkyworkR1VProcessor.get_num_image_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SkyworkR1VProcessor._images_to_pixel_values_lst", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "SkyworkR1VProcessor.__call__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [ { "kind": "property", "name": "SkyworkR1VProcessor.image_token_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "SkyworkR1VProcessor.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SkyworkR1VProcessor.tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SkyworkR1VProcessor.num_image_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SkyworkR1VProcessor.image_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SkyworkR1VProcessor.min_dynamic_patch", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SkyworkR1VProcessor.max_dynamic_patch", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SkyworkR1VProcessor.dynamic_image_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SkyworkR1VProcessor.use_thumbnail", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 43, "n_typed": 36, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 27, "n_attrs": 8, "n_properties": 1 }, { "kind": "attr", "name": "vllm.model_executor.models.skyworkr1v.SkyworkR1VImageInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.models.skyworkr1v.find_closest_aspect_ratio", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "attr", "name": "vllm.model_executor.models.skyworkr1v.IMAGENET_STD", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.model_executor.models.skyworkr1v.resolve_skyworkr1v_min_max_num", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "attr", "name": "vllm.model_executor.models.skyworkr1v.IMAGENET_MEAN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.skyworkr1v.IMG_START", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.model_executor.models.skyworkr1v.dynamic_preprocess_skyworkr1v", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.models.skyworkr1v.get_skyworkr1v_target_ratios", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.models.skyworkr1v.image_to_pixel_values_skyworkr1v", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "class", "name": "vllm.model_executor.models.skyworkr1v.SkyworkR1VDummyInputsBuilder", "methods": [ { "kind": "function", "name": "SkyworkR1VDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SkyworkR1VDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.skyworkr1v", "names": [ "vllm.model_executor.models.skyworkr1v.IMAGENET_MEAN", "vllm.model_executor.models.skyworkr1v.IMAGENET_STD", "vllm.model_executor.models.skyworkr1v.IMG_CONTEXT", "vllm.model_executor.models.skyworkr1v.IMG_END", "vllm.model_executor.models.skyworkr1v.IMG_START", "vllm.model_executor.models.skyworkr1v.SkyworkR1VChatModel", "vllm.model_executor.models.skyworkr1v.SkyworkR1VDummyInputsBuilder", "vllm.model_executor.models.skyworkr1v.SkyworkR1VImageEmbeddingInputs", "vllm.model_executor.models.skyworkr1v.SkyworkR1VImageInputs", "vllm.model_executor.models.skyworkr1v.SkyworkR1VImagePixelInputs", "vllm.model_executor.models.skyworkr1v.SkyworkR1VMultiModalProcessor", "vllm.model_executor.models.skyworkr1v.SkyworkR1VProcessingInfo", "vllm.model_executor.models.skyworkr1v.SkyworkR1VProcessor", "vllm.model_executor.models.skyworkr1v.build_transform", "vllm.model_executor.models.skyworkr1v.calculate_skyworkr1v_targets", "vllm.model_executor.models.skyworkr1v.dynamic_preprocess_skyworkr1v", "vllm.model_executor.models.skyworkr1v.find_closest_aspect_ratio", "vllm.model_executor.models.skyworkr1v.get_skyworkr1v_target_ratios", "vllm.model_executor.models.skyworkr1v.image_to_pixel_values_skyworkr1v", "vllm.model_executor.models.skyworkr1v.resolve_skyworkr1v_min_max_num" ], "n_typable": 167, "n_typed": 141, "n_any": 0, "n_untyped": 26, "n_functions": 7, "n_function_overloads": 7, "n_function_params": 26, "n_methods": 31, "n_method_overloads": 31, "n_method_params": 75, "n_classes": 7, "n_attrs": 32, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/smolvlm.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.smolvlm.SmolVLMForConditionalGeneration", "methods": [ { "kind": "function", "name": "SmolVLMForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.smolvlm.SmolVLMProcessingInfo", "methods": [ { "kind": "function", "name": "SmolVLMProcessingInfo.get_hf_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SmolVLMProcessingInfo._get_image_token", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.smolvlm", "names": [ "vllm.model_executor.models.smolvlm.SmolVLMForConditionalGeneration", "vllm.model_executor.models.smolvlm.SmolVLMProcessingInfo" ], "n_typable": 7, "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_classes": 2, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/solar.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.solar.SolarForCausalLM", "methods": [ { "kind": "function", "name": "SolarForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SolarForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SolarForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "SolarForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SolarForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SolarForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SolarForCausalLM.embedding_modules", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SolarForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SolarForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SolarForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SolarForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SolarForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SolarForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 13, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.solar.SolarDecoderLayer", "methods": [ { "kind": "function", "name": "SolarDecoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "SolarDecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SolarDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SolarDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SolarDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SolarDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SolarDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 9, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.solar.SolarModel", "methods": [ { "kind": "function", "name": "SolarModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SolarModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SolarModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "SolarModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SolarModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SolarModel.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SolarModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SolarModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SolarModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SolarModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 11, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.solar.SolarAttention", "methods": [ { "kind": "function", "name": "SolarAttention.__init__", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "SolarAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SolarAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SolarAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SolarAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SolarAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SolarAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SolarAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SolarAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SolarAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SolarAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SolarAttention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SolarAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SolarAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SolarAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SolarAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 27, "n_typed": 13, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 11, "n_attrs": 14, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.solar.SolarMLP", "methods": [ { "kind": "function", "name": "SolarMLP.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "SolarMLP.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SolarMLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SolarMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SolarMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.solar", "names": [ "vllm.model_executor.models.solar.SolarAttention", "vllm.model_executor.models.solar.SolarDecoderLayer", "vllm.model_executor.models.solar.SolarForCausalLM", "vllm.model_executor.models.solar.SolarMLP", "vllm.model_executor.models.solar.SolarModel" ], "n_typable": 91, "n_typed": 53, "n_any": 0, "n_untyped": 38, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 42, "n_classes": 5, "n_attrs": 36, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/stablelm.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.stablelm.StablelmAttention", "methods": [ { "kind": "function", "name": "StablelmAttention.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "StablelmAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "StablelmAttention.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StablelmAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StablelmAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StablelmAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StablelmAttention.total_num_key_value_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StablelmAttention.num_key_value_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StablelmAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StablelmAttention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StablelmAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StablelmAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StablelmAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StablelmAttention.qkv_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StablelmAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StablelmAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StablelmAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StablelmAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 24, "n_typed": 8, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 16, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.stablelm.StablelmMLP", "methods": [ { "kind": "function", "name": "StablelmMLP.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "StablelmMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "StablelmMLP.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StablelmMLP.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StablelmMLP.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StablelmMLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StablelmMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StablelmMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 6, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.stablelm.StableLMEpochModel", "methods": [ { "kind": "function", "name": "StableLMEpochModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StableLMEpochModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StableLMEpochModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "StableLMEpochModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "StableLMEpochModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StableLMEpochModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StableLMEpochModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 11, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.stablelm.StablelmDecoderLayer", "methods": [ { "kind": "function", "name": "StablelmDecoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "StablelmDecoderLayer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "StablelmDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StablelmDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StablelmDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StablelmDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 8, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.stablelm.StablelmForCausalLM", "methods": [ { "kind": "function", "name": "StablelmForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StablelmForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StablelmForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "StablelmForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StablelmForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "StablelmForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StablelmForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StablelmForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StablelmForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StablelmForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StablelmForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 13, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.stablelm", "names": [ "vllm.model_executor.models.stablelm.StableLMEpochModel", "vllm.model_executor.models.stablelm.StablelmAttention", "vllm.model_executor.models.stablelm.StablelmDecoderLayer", "vllm.model_executor.models.stablelm.StablelmForCausalLM", "vllm.model_executor.models.stablelm.StablelmMLP" ], "n_typable": 83, "n_typed": 46, "n_any": 0, "n_untyped": 37, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 33, "n_classes": 5, "n_attrs": 35, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/starcoder2.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.starcoder2.Starcoder2ForCausalLM", "methods": [ { "kind": "function", "name": "Starcoder2ForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Starcoder2ForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Starcoder2ForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Starcoder2ForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Starcoder2ForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Starcoder2ForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Starcoder2ForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Starcoder2ForCausalLM.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Starcoder2ForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Starcoder2ForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Starcoder2ForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 13, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.starcoder2.Starcoder2Model", "methods": [ { "kind": "function", "name": "Starcoder2Model.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Starcoder2Model.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Starcoder2Model.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Starcoder2Model.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Starcoder2Model.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Starcoder2Model.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Starcoder2Model.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Starcoder2Model.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Starcoder2Model.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 11, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.starcoder2.Starcoder2Attention", "methods": [ { "kind": "function", "name": "Starcoder2Attention.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Starcoder2Attention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Starcoder2Attention.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Starcoder2Attention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Starcoder2Attention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Starcoder2Attention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Starcoder2Attention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Starcoder2Attention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Starcoder2Attention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Starcoder2Attention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Starcoder2Attention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Starcoder2Attention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Starcoder2Attention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Starcoder2Attention.use_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Starcoder2Attention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Starcoder2Attention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Starcoder2Attention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Starcoder2Attention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 24, "n_typed": 7, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 16, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.starcoder2.Starcoder2MLP", "methods": [ { "kind": "function", "name": "Starcoder2MLP.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Starcoder2MLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Starcoder2MLP.c_fc", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Starcoder2MLP.c_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Starcoder2MLP.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 5, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.starcoder2.Starcoder2DecoderLayer", "methods": [ { "kind": "function", "name": "Starcoder2DecoderLayer.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Starcoder2DecoderLayer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Starcoder2DecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Starcoder2DecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Starcoder2DecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Starcoder2DecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Starcoder2DecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 7, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 5, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.starcoder2", "names": [ "vllm.model_executor.models.starcoder2.Starcoder2Attention", "vllm.model_executor.models.starcoder2.Starcoder2DecoderLayer", "vllm.model_executor.models.starcoder2.Starcoder2ForCausalLM", "vllm.model_executor.models.starcoder2.Starcoder2MLP", "vllm.model_executor.models.starcoder2.Starcoder2Model" ], "n_typable": 83, "n_typed": 43, "n_any": 0, "n_untyped": 40, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 33, "n_classes": 5, "n_attrs": 35, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/step1.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.models.step1.STEP_PACKED_MODULES_MAPPING", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.step1.Step1ForCausalLM", "methods": [ { "kind": "function", "name": "Step1ForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Step1ForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Step1ForCausalLM.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Step1ForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Step1ForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Step1ForCausalLM.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Step1ForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step1ForCausalLM.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step1ForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step1ForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step1ForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step1ForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 13, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.step1.StepDecoderModel", "methods": [ { "kind": "function", "name": "StepDecoderModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StepDecoderModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StepDecoderModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "StepDecoderModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StepDecoderModel.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StepDecoderModel.aux_hidden_state_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "StepDecoderModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StepDecoderModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StepDecoderModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 10, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.step1.StepDecoderLayer", "methods": [ { "kind": "function", "name": "StepDecoderLayer.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StepDecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "StepDecoderLayer.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "StepDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StepDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StepDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StepDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StepDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 8, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.step1.StepAttention", "methods": [ { "kind": "function", "name": "StepAttention.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "StepAttention.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "StepAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StepAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StepAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StepAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StepAttention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StepAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StepAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StepAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StepAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StepAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StepAttention.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StepAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 5, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 12, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.step1.StepMLP", "methods": [ { "kind": "function", "name": "StepMLP.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "StepMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "StepMLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StepMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StepMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 7, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.step1", "names": [ "vllm.model_executor.models.step1.STEP_PACKED_MODULES_MAPPING", "vllm.model_executor.models.step1.Step1ForCausalLM", "vllm.model_executor.models.step1.StepAttention", "vllm.model_executor.models.step1.StepDecoderLayer", "vllm.model_executor.models.step1.StepDecoderModel", "vllm.model_executor.models.step1.StepMLP" ], "n_typable": 80, "n_typed": 43, "n_any": 0, "n_untyped": 37, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 33, "n_classes": 5, "n_attrs": 34, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/step3_text.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.step3_text.FusedMoEBlock", "methods": [ { "kind": "function", "name": "FusedMoEBlock.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "FusedMoEBlock.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FusedMoEBlock.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoEBlock.experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoEBlock.gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 5, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.step3_text.Step3TextDecoderLayer", "methods": [ { "kind": "function", "name": "Step3TextDecoderLayer.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Step3TextDecoderLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Step3TextDecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextDecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextDecoderLayer.moe", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextDecoderLayer.share_expert", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextDecoderLayer.use_moe", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 9, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.step3_text.Step3TextAttention", "methods": [ { "kind": "function", "name": "Step3TextAttention.__init__", "n_typed": 11, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "Step3TextAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Step3TextAttention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextAttention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextAttention.inter_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextAttention.wq", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextAttention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 28, "n_typed": 14, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 13, "n_attrs": 13, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.step3_text.Step3TextModel", "methods": [ { "kind": "function", "name": "Step3TextModel.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Step3TextModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Step3TextModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Step3TextModel.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextModel.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextModel.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 10, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.step3_text.Step3TextMLP", "methods": [ { "kind": "function", "name": "Step3TextMLP.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Step3TextMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Step3TextMLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextMLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextMLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextMLP.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 8, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 4, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.step3_text.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.step3_text.Step3TextForCausalLM", "methods": [ { "kind": "function", "name": "Step3TextForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Step3TextForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Step3TextForCausalLM.forward", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Step3TextForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Step3TextForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Step3TextForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextForCausalLM.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 12, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.step3_text", "names": [ "vllm.model_executor.models.step3_text.FusedMoEBlock", "vllm.model_executor.models.step3_text.Step3TextAttention", "vllm.model_executor.models.step3_text.Step3TextDecoderLayer", "vllm.model_executor.models.step3_text.Step3TextForCausalLM", "vllm.model_executor.models.step3_text.Step3TextMLP", "vllm.model_executor.models.step3_text.Step3TextModel", "vllm.model_executor.models.step3_text.logger" ], "n_typable": 102, "n_typed": 58, "n_any": 0, "n_untyped": 44, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 16, "n_method_overloads": 16, "n_method_params": 46, "n_classes": 6, "n_attrs": 40, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/step3_vl.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.step3_vl.Step3VisionEmbeddings", "methods": [ { "kind": "function", "name": "Step3VisionEmbeddings.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Step3VisionEmbeddings.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Step3VisionEmbeddings.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VisionEmbeddings.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VisionEmbeddings.image_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VisionEmbeddings.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VisionEmbeddings.class_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VisionEmbeddings.patch_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VisionEmbeddings.num_patches", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VisionEmbeddings.pad_tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VisionEmbeddings.position_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 3, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 9, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.step3_vl.Step3VLImageInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.step3_vl.Step3VisionAttention", "methods": [ { "kind": "function", "name": "Step3VisionAttention.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Step3VisionAttention.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Step3VisionAttention.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VisionAttention.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VisionAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VisionAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VisionAttention.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VisionAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VisionAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VisionAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VisionAttention.out_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VisionAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 3, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 10, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.step3_vl.Step3VisionMLP", "methods": [ { "kind": "function", "name": "Step3VisionMLP.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Step3VisionMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Step3VisionMLP.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VisionMLP.activation_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VisionMLP.fc1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VisionMLP.fc2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 4, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 4, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.step3_vl.MAX_IMAGE_SIZE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.step3_vl.Step3VLMultiModalProcessor", "methods": [ { "kind": "function", "name": "Step3VLMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Step3VLMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.step3_vl.Step3VLProcessingInfo", "methods": [ { "kind": "function", "name": "Step3VLProcessingInfo.get_hf_processor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Step3VLProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Step3VLProcessingInfo.get_max_image_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Step3VLProcessingInfo.get_mm_max_tokens_per_item", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Step3VLProcessingInfo.get_image_size_with_most_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Step3VLProcessingInfo.get_num_mm_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.step3_vl.Step3VisionTransformer", "methods": [ { "kind": "function", "name": "Step3VisionTransformer.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Step3VisionTransformer.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Step3VisionTransformer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VisionTransformer.use_data_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VisionTransformer.image_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VisionTransformer.embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VisionTransformer.transformer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 4, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.step3_vl.Step3VisionProcessor", "methods": [ { "kind": "function", "name": "Step3VisionProcessor.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Step3VisionProcessor.__call__", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Step3VisionProcessor.transform", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VisionProcessor.patch_transform", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 0, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.step3_vl.Step3VLProcessor", "methods": [ { "kind": "function", "name": "Step3VLProcessor.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Step3VLProcessor.get_num_image_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Step3VLProcessor._split_images", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Step3VLProcessor._convert_images_to_pixel_values", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Step3VLProcessor._get_patch_repl", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Step3VLProcessor._get_image_repl", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Step3VLProcessor._get_image_repl_features", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Step3VLProcessor.replace_placeholder", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Step3VLProcessor.__call__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [ { "kind": "property", "name": "Step3VLProcessor.image_token_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "Step3VLProcessor.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VLProcessor.tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VLProcessor.image_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VLProcessor.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VLProcessor.image_preprocessor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VLProcessor.num_image_feature_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VLProcessor.num_patch_feature_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VLProcessor.image_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VLProcessor.image_feature_placeholder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VLProcessor.patch_feature_placeholder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VLProcessor.patcher", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 40, "n_typed": 29, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 19, "n_attrs": 11, "n_properties": 1 }, { "kind": "class", "name": "vllm.model_executor.models.step3_vl.Step3VLForConditionalGeneration", "methods": [ { "kind": "function", "name": "Step3VLForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Step3VLForConditionalGeneration.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Step3VLForConditionalGeneration._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Step3VLForConditionalGeneration._process_image_features", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Step3VLForConditionalGeneration._get_vision_model_output", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Step3VLForConditionalGeneration._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Step3VLForConditionalGeneration.embed_multimodal", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Step3VLForConditionalGeneration.embed_input_ids", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Step3VLForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Step3VLForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Step3VLForConditionalGeneration.load_weights", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "Step3VLForConditionalGeneration.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "Step3VLForConditionalGeneration.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "Step3VLForConditionalGeneration.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VLForConditionalGeneration.supports_encoder_tp_data", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Step3VLForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VLForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VLForConditionalGeneration.use_data_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VLForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VLForConditionalGeneration.vision_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VLForConditionalGeneration.vit_downsampler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VLForConditionalGeneration.vit_downsampler2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VLForConditionalGeneration.vit_large_projector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VLForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 43, "n_typed": 29, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 20, "n_attrs": 11, "n_properties": 2 }, { "kind": "class", "name": "vllm.model_executor.models.step3_vl.Step3VLImageEmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Step3VLImageEmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Step3VLImageEmbeddingInputs.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.step3_vl.ImageWithPatches", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.step3_vl.ImagePatcher", "methods": [ { "kind": "function", "name": "ImagePatcher.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ImagePatcher.determine_window_size", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ImagePatcher.slide_window", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "ImagePatcher.square_pad", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ImagePatcher.get_image_size_for_padding", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ImagePatcher.get_image_size_for_preprocess", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ImagePatcher.get_image_size_for_crop", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ImagePatcher.patch_crop", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "ImagePatcher.get_num_patches", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ImagePatcher.__call__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ImagePatcher.enable_patch", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 35, "n_typed": 32, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 24, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.step3_vl.get_abs_pos", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.models.step3_vl.Step3VLImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Step3VLImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Step3VLImagePixelInputs.pixel_values", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Step3VLImagePixelInputs.patch_pixel_values", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Step3VLImagePixelInputs.num_patches", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.step3_vl.Step3VLDummyInputsBuilder", "methods": [ { "kind": "function", "name": "Step3VLDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Step3VLDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.step3_vl.Step3VisionEncoderLayer", "methods": [ { "kind": "function", "name": "Step3VisionEncoderLayer.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Step3VisionEncoderLayer.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Step3VisionEncoderLayer.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VisionEncoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VisionEncoderLayer.layer_norm1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VisionEncoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VisionEncoderLayer.layer_norm2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 5, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.step3_vl.Step3VisionEncoder", "methods": [ { "kind": "function", "name": "Step3VisionEncoder.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Step3VisionEncoder.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Step3VisionEncoder.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VisionEncoder.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 3, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.step3_vl", "names": [ "vllm.model_executor.models.step3_vl.ImagePatcher", "vllm.model_executor.models.step3_vl.ImageWithPatches", "vllm.model_executor.models.step3_vl.MAX_IMAGE_SIZE", "vllm.model_executor.models.step3_vl.Step3VLDummyInputsBuilder", "vllm.model_executor.models.step3_vl.Step3VLForConditionalGeneration", "vllm.model_executor.models.step3_vl.Step3VLImageEmbeddingInputs", "vllm.model_executor.models.step3_vl.Step3VLImageInputs", "vllm.model_executor.models.step3_vl.Step3VLImagePixelInputs", "vllm.model_executor.models.step3_vl.Step3VLMultiModalProcessor", "vllm.model_executor.models.step3_vl.Step3VLProcessingInfo", "vllm.model_executor.models.step3_vl.Step3VLProcessor", "vllm.model_executor.models.step3_vl.Step3VisionAttention", "vllm.model_executor.models.step3_vl.Step3VisionEmbeddings", "vllm.model_executor.models.step3_vl.Step3VisionEncoder", "vllm.model_executor.models.step3_vl.Step3VisionEncoderLayer", "vllm.model_executor.models.step3_vl.Step3VisionMLP", "vllm.model_executor.models.step3_vl.Step3VisionProcessor", "vllm.model_executor.models.step3_vl.Step3VisionTransformer", "vllm.model_executor.models.step3_vl.get_abs_pos" ], "n_typable": 229, "n_typed": 142, "n_any": 0, "n_untyped": 87, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 54, "n_method_overloads": 54, "n_method_params": 102, "n_classes": 15, "n_attrs": 69, "n_properties": 3, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/step3p5.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.models.step3p5.get_spec_layer_idx_from_weight_name", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.models.step3p5.FP32ReplicatedLinear", "methods": [ { "kind": "function", "name": "FP32ReplicatedLinear.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.step3p5.Step3p5Attention", "methods": [ { "kind": "function", "name": "Step3p5Attention.__init__", "n_typed": 20, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 21, "n_params": 20, "n_function_overloads": 1, "n_function_params": 20 }, { "kind": "function", "name": "Step3p5Attention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Step3p5Attention.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Attention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Attention.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Attention.rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Attention.partial_rotary_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Attention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Attention.total_num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Attention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Attention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Attention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Attention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Attention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Attention.rope_theta", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Attention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Attention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Attention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Attention.q_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Attention.k_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Attention.use_head_wise_attn_gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Attention.use_rope", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Attention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Attention.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Attention.rotary_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Attention.g_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 48, "n_typed": 23, "n_any": 0, "n_untyped": 25, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 22, "n_attrs": 24, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.step3p5.Step3p5ForCausalLM", "methods": [ { "kind": "function", "name": "Step3p5ForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Step3p5ForCausalLM.forward", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Step3p5ForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Step3p5ForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Step3p5ForCausalLM.set_eplb_state", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Step3p5ForCausalLM.update_physical_experts_metadata", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Step3p5ForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Step3p5ForCausalLM.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5ForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5ForCausalLM.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5ForCausalLM.moe_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5ForCausalLM.expert_weights", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5ForCausalLM.num_moe_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5ForCausalLM.num_expert_groups", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5ForCausalLM.num_shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5ForCausalLM.num_logical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5ForCausalLM.num_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5ForCausalLM.num_local_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5ForCausalLM.num_routed_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5ForCausalLM.num_redundant_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5ForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5ForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 36, "n_typed": 20, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 14, "n_attrs": 15, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.step3p5.Step3p5MLP", "methods": [ { "kind": "function", "name": "Step3p5MLP.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "Step3p5MLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Step3p5MLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5MLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5MLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5MLP.prefix", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5MLP.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5MLP.limit", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 10, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.step3p5.Step3p5DecoderLayer", "methods": [ { "kind": "function", "name": "Step3p5DecoderLayer.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Step3p5DecoderLayer.add_and_maybe_inplace_all_reduce", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Step3p5DecoderLayer.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Step3p5DecoderLayer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5DecoderLayer.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5DecoderLayer.use_moe", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5DecoderLayer.tp_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5DecoderLayer.use_fused_all_reduce", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5DecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5DecoderLayer.post_attention_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5DecoderLayer.prefix", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5DecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5DecoderLayer.moe", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5DecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 9, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_attrs": 11, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.step3p5.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.step3p5.Step3p5Model", "methods": [ { "kind": "function", "name": "Step3p5Model.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Step3p5Model.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Step3p5Model.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Step3p5Model.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Step3p5Model.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Model.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Model.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Model.moe_num_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Model.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Model.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Model.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 12, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.step3p5.FusedMoEBlock", "methods": [ { "kind": "function", "name": "FusedMoEBlock.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FusedMoEBlock.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FusedMoEBlock.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoEBlock.layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoEBlock.ep_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoEBlock.ep_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoEBlock.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoEBlock.enable_eplb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoEBlock.n_routed_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoEBlock.n_logical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoEBlock.n_redundant_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoEBlock.n_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoEBlock.n_local_physical_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoEBlock.physical_expert_start", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoEBlock.physical_expert_end", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoEBlock.gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoEBlock.use_moe_router_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoEBlock.routed_scaling_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoEBlock.router_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoEBlock.need_fp32_gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoEBlock.share_expert", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FusedMoEBlock.experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 25, "n_typed": 4, "n_any": 0, "n_untyped": 21, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 20, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.step3p5", "names": [ "vllm.model_executor.models.step3p5.FP32ReplicatedLinear", "vllm.model_executor.models.step3p5.FusedMoEBlock", "vllm.model_executor.models.step3p5.Step3p5Attention", "vllm.model_executor.models.step3p5.Step3p5DecoderLayer", "vllm.model_executor.models.step3p5.Step3p5ForCausalLM", "vllm.model_executor.models.step3p5.Step3p5MLP", "vllm.model_executor.models.step3p5.Step3p5Model", "vllm.model_executor.models.step3p5.get_spec_layer_idx_from_weight_name", "vllm.model_executor.models.step3p5.logger" ], "n_typable": 170, "n_typed": 83, "n_any": 0, "n_untyped": 87, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 21, "n_method_overloads": 21, "n_method_params": 62, "n_classes": 7, "n_attrs": 84, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/step3p5_mtp.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.step3p5_mtp.Step3p5AMultiTokenPredictor", "methods": [ { "kind": "function", "name": "Step3p5AMultiTokenPredictor.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Step3p5AMultiTokenPredictor.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Step3p5AMultiTokenPredictor.compute_logits", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Step3p5AMultiTokenPredictor.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Step3p5AMultiTokenPredictor.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5AMultiTokenPredictor.mtp_start_layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5AMultiTokenPredictor.num_mtp_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5AMultiTokenPredictor.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5AMultiTokenPredictor.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 13, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 10, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.step3p5_mtp.Step3p5AMultiTokenPredictorLayer", "methods": [ { "kind": "function", "name": "Step3p5AMultiTokenPredictorLayer.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Step3p5AMultiTokenPredictorLayer.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Step3p5AMultiTokenPredictorLayer.enorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5AMultiTokenPredictorLayer.hnorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5AMultiTokenPredictorLayer.eh_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5AMultiTokenPredictorLayer.shared_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5AMultiTokenPredictorLayer.mtp_block", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 9, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.step3p5_mtp.SharedHead", "methods": [ { "kind": "function", "name": "SharedHead.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SharedHead.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SharedHead.norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SharedHead.head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.step3p5_mtp.Step3p5MTP", "methods": [ { "kind": "function", "name": "Step3p5MTP.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Step3p5MTP.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Step3p5MTP.forward", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Step3p5MTP.compute_logits", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Step3p5MTP.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Step3p5MTP._rewrite_spec_layer_name", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Step3p5MTP.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5MTP.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5MTP.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 23, "n_typed": 19, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 14, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.step3p5_mtp.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.models.step3p5_mtp", "names": [ "vllm.model_executor.models.step3p5_mtp.SharedHead", "vllm.model_executor.models.step3p5_mtp.Step3p5AMultiTokenPredictor", "vllm.model_executor.models.step3p5_mtp.Step3p5AMultiTokenPredictorLayer", "vllm.model_executor.models.step3p5_mtp.Step3p5MTP", "vllm.model_executor.models.step3p5_mtp.logger" ], "n_typable": 64, "n_typed": 46, "n_any": 0, "n_untyped": 18, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 34, "n_classes": 4, "n_attrs": 16, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/step_vl.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.models.step_vl.apply_rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 6, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "class", "name": "vllm.model_executor.models.step_vl.PerceptionEncoderVisionBlock", "methods": [ { "kind": "function", "name": "PerceptionEncoderVisionBlock.__init__", "n_typed": 11, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "PerceptionEncoderVisionBlock.forward", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PerceptionEncoderVisionBlock.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoderVisionBlock.ls_1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoderVisionBlock.ls_2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoderVisionBlock.ln_1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoderVisionBlock.ln_2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoderVisionBlock.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 13, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 13, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.step_vl.PerceptionEncoderRope2D", "methods": [ { "kind": "function", "name": "PerceptionEncoderRope2D.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "PerceptionEncoderRope2D._compute_inv_freq", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PerceptionEncoderRope2D._compute_freqs", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PerceptionEncoderRope2D._compute_2d_freqs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PerceptionEncoderRope2D.forward", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PerceptionEncoderRope2D.dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoderRope2D.max_grid_height", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoderRope2D.max_grid_width", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoderRope2D.use_cls_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoderRope2D.theta", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoderRope2D.max_freq", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoderRope2D.num_freqs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 27, "n_typed": 13, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 15, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.step_vl.PerceptionEncoder", "methods": [ { "kind": "function", "name": "PerceptionEncoder.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "PerceptionEncoder.sample_abs_posemb", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PerceptionEncoder.forward_features", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PerceptionEncoder.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PerceptionEncoder.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoder.output_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoder.heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoder.width", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoder.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoder.use_abs_posemb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoder.use_cls_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoder.use_rope2d", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoder.image_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoder.conv1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoder.ln_pre", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoder.ln_post", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoder.transformer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoder.vit_downsampler1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoder.vit_downsampler2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoder.class_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoder.posemb_grid_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoder.positional_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 31, "n_typed": 8, "n_any": 0, "n_untyped": 23, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 9, "n_attrs": 18, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.step_vl.PerceptionEncoderLayerScale", "methods": [ { "kind": "function", "name": "PerceptionEncoderLayerScale.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "PerceptionEncoderLayerScale.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PerceptionEncoderLayerScale.inplace", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoderLayerScale.gamma", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 0, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.step_vl.PerceptionEncoderVisionTransformer", "methods": [ { "kind": "function", "name": "PerceptionEncoderVisionTransformer.__init__", "n_typed": 12, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 }, { "kind": "function", "name": "PerceptionEncoderVisionTransformer.forward", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PerceptionEncoderVisionTransformer.width", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoderVisionTransformer.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoderVisionTransformer.resblocks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 14, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 14, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.step_vl.PerceptionEncoderMLP", "methods": [ { "kind": "function", "name": "PerceptionEncoderMLP.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "PerceptionEncoderMLP.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PerceptionEncoderMLP.fc1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoderMLP.activation", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoderMLP.fc2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 7, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.step_vl.StepVLForConditionalGeneration", "methods": [ { "kind": "function", "name": "StepVLForConditionalGeneration.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StepVLForConditionalGeneration._get_vision_model_output", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StepVLForConditionalGeneration._process_image_features", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "StepVLForConditionalGeneration.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StepVLForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StepVLForConditionalGeneration.multimodal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StepVLForConditionalGeneration.use_data_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StepVLForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StepVLForConditionalGeneration.vision_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StepVLForConditionalGeneration.vit_large_projector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StepVLForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 7, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.step_vl.PerceptionEncoderVisionAttention", "methods": [ { "kind": "function", "name": "PerceptionEncoderVisionAttention.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "PerceptionEncoderVisionAttention.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PerceptionEncoderVisionAttention.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoderVisionAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoderVisionAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoderVisionAttention.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoderVisionAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoderVisionAttention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoderVisionAttention.out_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoderVisionAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerceptionEncoderVisionAttention.rope", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 10, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 9, "n_attrs": 9, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.step_vl.rotate_half", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.model_executor.models.step_vl", "names": [ "vllm.model_executor.models.step_vl.PerceptionEncoder", "vllm.model_executor.models.step_vl.PerceptionEncoderLayerScale", "vllm.model_executor.models.step_vl.PerceptionEncoderMLP", "vllm.model_executor.models.step_vl.PerceptionEncoderRope2D", "vllm.model_executor.models.step_vl.PerceptionEncoderVisionAttention", "vllm.model_executor.models.step_vl.PerceptionEncoderVisionBlock", "vllm.model_executor.models.step_vl.PerceptionEncoderVisionTransformer", "vllm.model_executor.models.step_vl.StepVLForConditionalGeneration", "vllm.model_executor.models.step_vl.apply_rotary_emb", "vllm.model_executor.models.step_vl.rotate_half" ], "n_typable": 160, "n_typed": 72, "n_any": 0, "n_untyped": 88, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 6, "n_methods": 22, "n_method_overloads": 22, "n_method_params": 74, "n_classes": 8, "n_attrs": 56, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/tarsier.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.tarsier.TarsierImageEmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "TarsierImageEmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TarsierImageEmbeddingInputs.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.tarsier.TarsierProcessorKwargs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "TarsierProcessorKwargs._defaults", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.tarsier.init_vision_tower_for_tarsier", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.model_executor.models.tarsier.TarsierProcessor", "methods": [ { "kind": "function", "name": "TarsierProcessor.__call__", "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.tarsier.TarsierHfConfig", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.tarsier.TarsierMultiModalProcessor", "methods": [ { "kind": "function", "name": "TarsierMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TarsierMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.tarsier.TarsierDummyInputsBuilder", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.tarsier.TarsierImagePixelInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "TarsierImagePixelInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TarsierImagePixelInputs.pixel_values", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.tarsier.TarsierProcessingInfo", "methods": [ { "kind": "function", "name": "TarsierProcessingInfo.get_hf_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TarsierProcessingInfo.get_vision_encoder_info", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TarsierProcessingInfo.get_hf_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TarsierProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TarsierProcessingInfo.get_num_image_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TarsierProcessingInfo.get_image_size_with_most_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TarsierProcessingInfo.get_max_image_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TarsierProcessingInfo.get_image_newline_idx", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TarsierProcessingInfo.get_image_new_idx", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.tarsier.TarsierMultiModalProjector", "methods": [ { "kind": "function", "name": "TarsierMultiModalProjector.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "TarsierMultiModalProjector.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TarsierMultiModalProjector.linear_1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TarsierMultiModalProjector.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TarsierMultiModalProjector.linear_2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 8, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.tarsier.TarsierImageInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.tarsier.TarsierForConditionalGeneration", "methods": [ { "kind": "function", "name": "TarsierForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TarsierForConditionalGeneration.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TarsierForConditionalGeneration._parse_and_validate_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TarsierForConditionalGeneration._image_pixels_to_features", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TarsierForConditionalGeneration._add_tarsier_split_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TarsierForConditionalGeneration._process_image_pixels", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TarsierForConditionalGeneration._process_image_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TarsierForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TarsierForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "TarsierForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TarsierForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TarsierForConditionalGeneration.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TarsierForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TarsierForConditionalGeneration.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TarsierForConditionalGeneration.vision_tower", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TarsierForConditionalGeneration.multi_modal_projector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TarsierForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 34, "n_typed": 29, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 18, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.tarsier", "names": [ "vllm.model_executor.models.tarsier.TarsierDummyInputsBuilder", "vllm.model_executor.models.tarsier.TarsierForConditionalGeneration", "vllm.model_executor.models.tarsier.TarsierHfConfig", "vllm.model_executor.models.tarsier.TarsierImageEmbeddingInputs", "vllm.model_executor.models.tarsier.TarsierImageInputs", "vllm.model_executor.models.tarsier.TarsierImagePixelInputs", "vllm.model_executor.models.tarsier.TarsierMultiModalProcessor", "vllm.model_executor.models.tarsier.TarsierMultiModalProjector", "vllm.model_executor.models.tarsier.TarsierProcessingInfo", "vllm.model_executor.models.tarsier.TarsierProcessor", "vllm.model_executor.models.tarsier.TarsierProcessorKwargs", "vllm.model_executor.models.tarsier.init_vision_tower_for_tarsier" ], "n_typable": 81, "n_typed": 70, "n_any": 0, "n_untyped": 11, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 4, "n_methods": 25, "n_method_overloads": 25, "n_method_params": 38, "n_classes": 10, "n_attrs": 15, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/telechat2.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.telechat2.TeleChat2Model", "methods": [ { "kind": "function", "name": "TeleChat2Model.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TeleChat2Model.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 5, "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.telechat2.TeleChat2ForCausalLM", "methods": [ { "kind": "function", "name": "TeleChat2ForCausalLM._init_model", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "TeleChat2ForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TeleChat2ForCausalLM.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.telechat2", "names": [ "vllm.model_executor.models.telechat2.TeleChat2ForCausalLM", "vllm.model_executor.models.telechat2.TeleChat2Model" ], "n_typable": 12, "n_typed": 9, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 7, "n_classes": 2, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/teleflm.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.teleflm.TeleFLMForCausalLM", "methods": [ { "kind": "function", "name": "TeleFLMForCausalLM.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TeleFLMForCausalLM.use_mup", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TeleFLMForCausalLM.mup_scale_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TeleFLMForCausalLM.output_mult", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TeleFLMForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 2, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.teleflm.TeleFLMModel", "methods": [ { "kind": "function", "name": "TeleFLMModel.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "TeleFLMModel.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TeleFLMModel.use_mup", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TeleFLMModel.input_mult", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 5, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.teleflm", "names": [ "vllm.model_executor.models.teleflm.TeleFLMForCausalLM", "vllm.model_executor.models.teleflm.TeleFLMModel" ], "n_typable": 15, "n_typed": 7, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_classes": 2, "n_attrs": 6, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/terratorch.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.terratorch.TerratorchMultiModalProcessor", "methods": [ { "kind": "function", "name": "TerratorchMultiModalProcessor._get_mm_fields_config", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "TerratorchMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "TerratorchMultiModalProcessor.apply", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 11, "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 8, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.terratorch.TerratorchProcessingInfo", "methods": [ { "kind": "function", "name": "TerratorchProcessingInfo.get_data_parser", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TerratorchProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "TerratorchProcessingInfo.input_definition", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 0, "n_attrs": 0, "n_properties": 1 }, { "kind": "class", "name": "vllm.model_executor.models.terratorch.TerratorchMultiModalDataParser", "methods": [ { "kind": "function", "name": "TerratorchMultiModalDataParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "TerratorchMultiModalDataParser._parse_image_data", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TerratorchMultiModalDataParser.parse_mm_data", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TerratorchMultiModalDataParser.input_definition", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 5, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 5, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.terratorch.Terratorch", "methods": [ { "kind": "function", "name": "Terratorch.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Terratorch.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Terratorch.embed_input_ids", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Terratorch.forward", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Terratorch.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Terratorch.supports_multimodal_raw_input_only", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Terratorch.is_pooling_model", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Terratorch.inference_runner", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Terratorch.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Terratorch.pooler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 17, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 14, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.terratorch.TerratorchInputBuilder", "methods": [ { "kind": "function", "name": "TerratorchInputBuilder.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TerratorchInputBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TerratorchInputBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TerratorchInputBuilder.dummy_data_generator", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 7, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 5, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.terratorch.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.models.terratorch", "names": [ "vllm.model_executor.models.terratorch.Terratorch", "vllm.model_executor.models.terratorch.TerratorchInputBuilder", "vllm.model_executor.models.terratorch.TerratorchMultiModalDataParser", "vllm.model_executor.models.terratorch.TerratorchMultiModalProcessor", "vllm.model_executor.models.terratorch.TerratorchProcessingInfo", "vllm.model_executor.models.terratorch.logger" ], "n_typable": 55, "n_typed": 42, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 16, "n_method_overloads": 16, "n_method_params": 32, "n_classes": 5, "n_attrs": 8, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/transformers/__init__.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.transformers.TransformersMultiModalEmbeddingModel", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.transformers.TransformersMultiModalForSequenceClassification", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.transformers.TransformersMoEForCausalLM", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.transformers.TransformersForSequenceClassification", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.transformers.TransformersEmbeddingModel", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.transformers.TransformersMoEEmbeddingModel", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.transformers.TransformersForCausalLM", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.transformers.TransformersMultiModalForCausalLM", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.transformers.TransformersMultiModalMoEForCausalLM", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.transformers.TransformersMoEForSequenceClassification", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.transformers", "names": [ "vllm.model_executor.models.transformers.TransformersEmbeddingModel", "vllm.model_executor.models.transformers.TransformersForCausalLM", "vllm.model_executor.models.transformers.TransformersForSequenceClassification", "vllm.model_executor.models.transformers.TransformersMoEEmbeddingModel", "vllm.model_executor.models.transformers.TransformersMoEForCausalLM", "vllm.model_executor.models.transformers.TransformersMoEForSequenceClassification", "vllm.model_executor.models.transformers.TransformersMultiModalEmbeddingModel", "vllm.model_executor.models.transformers.TransformersMultiModalForCausalLM", "vllm.model_executor.models.transformers.TransformersMultiModalForSequenceClassification", "vllm.model_executor.models.transformers.TransformersMultiModalMoEForCausalLM" ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 10, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/transformers/base.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.models.transformers.base.PreTrainedModel", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.transformers.base.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.models.transformers.base.vllm_flash_attention_forward", "n_typed": 7, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "class", "name": "vllm.model_executor.models.transformers.base.Base", "methods": [ { "kind": "function", "name": "Base.__init_subclass__", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Base.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Base.pipeline_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Base.recursive_replace", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Base.create_attention_instances", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Base.init_parameters", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Base.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Base.forward", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Base.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Base.check_version", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Base.set_aux_hidden_state_layers", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Base.get_eagle3_aux_hidden_state_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Base.embedding_modules", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Base.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Base.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Base.text_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Base.cache_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Base.device_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Base.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Base.parallel_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Base.quant_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Base.pp_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Base.tp_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Base.skip_prefixes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Base.skip_substrs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Base.ignore_unexpected_prefixes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Base.ignore_unexpected_suffixes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Base.attention_instances", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Base.embed_scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Base.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Base.model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 46, "n_typed": 24, "n_any": 0, "n_untyped": 22, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 16, "n_attrs": 19, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.transformers.base", "names": [ "vllm.model_executor.models.transformers.base.Base", "vllm.model_executor.models.transformers.base.PreTrainedModel", "vllm.model_executor.models.transformers.base.logger", "vllm.model_executor.models.transformers.base.vllm_flash_attention_forward" ], "n_typable": 56, "n_typed": 31, "n_any": 0, "n_untyped": 25, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 8, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 16, "n_classes": 1, "n_attrs": 21, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/transformers/causal.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.transformers.causal.CausalMixin", "methods": [ { "kind": "function", "name": "CausalMixin.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CausalMixin.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CausalMixin.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CausalMixin.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 4, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.transformers.causal", "names": [ "vllm.model_executor.models.transformers.causal.CausalMixin" ], "n_typable": 7, "n_typed": 4, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_classes": 1, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/transformers/legacy.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.transformers.legacy.LegacyMixin", "methods": [ { "kind": "function", "name": "LegacyMixin.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LegacyMixin.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LegacyMixin.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LegacyMixin.is_roberta", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LegacyMixin.padding_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 7, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.transformers.legacy", "names": [ "vllm.model_executor.models.transformers.legacy.LegacyMixin" ], "n_typable": 11, "n_typed": 7, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_classes": 1, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/transformers/moe.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.transformers.moe.TransformersFusedMoE", "methods": [ { "kind": "function", "name": "TransformersFusedMoE.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TransformersFusedMoE.forward", "n_typed": 4, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [], "n_typable": 8, "n_typed": 4, "n_any": 1, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.transformers.moe.transformers_moe_forward_fake", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.models.transformers.moe.transformers_moe_forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.model_executor.models.transformers.moe.MoEMixin", "methods": [ { "kind": "function", "name": "MoEMixin.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MoEMixin.set_eplb_state", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MoEMixin.update_physical_experts_metadata", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MoEMixin.get_expert_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MoEMixin.recursive_replace", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 8, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 7, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.transformers.moe", "names": [ "vllm.model_executor.models.transformers.moe.MoEMixin", "vllm.model_executor.models.transformers.moe.TransformersFusedMoE", "vllm.model_executor.models.transformers.moe.transformers_moe_forward", "vllm.model_executor.models.transformers.moe.transformers_moe_forward_fake" ], "n_typable": 30, "n_typed": 22, "n_any": 1, "n_untyped": 7, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 8, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 13, "n_classes": 2, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/transformers/multimodal.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.models.transformers.multimodal.DYNAMIC_ARG_DIMS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.transformers.multimodal.MultiModalDummyInputsBuilder", "methods": [ { "kind": "function", "name": "MultiModalDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiModalDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.transformers.multimodal.MultiModalMixin", "methods": [ { "kind": "function", "name": "MultiModalMixin.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MultiModalMixin.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MultiModalMixin.get_language_model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MultiModalMixin.embed_multimodal", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiModalMixin.get_mrope_input_positions", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MultiModalMixin.supports_multimodal_raw_input_only", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MultiModalMixin.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 12, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 10, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.transformers.multimodal.MultiModalProcessor", "methods": [ { "kind": "function", "name": "MultiModalProcessor._get_prompt_updates", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MultiModalProcessor._get_hf_mm_data", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiModalProcessor.apply", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 11, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.transformers.multimodal.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.transformers.multimodal.MultiModalProcessingInfo", "methods": [ { "kind": "function", "name": "MultiModalProcessingInfo.get_supported_mm_limits", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MultiModalProcessingInfo.get_mm_max_tokens_per_item", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MultiModalProcessingInfo.get_max_image_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MultiModalProcessingInfo.get_max_image_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 1, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.transformers.multimodal", "names": [ "vllm.model_executor.models.transformers.multimodal.DYNAMIC_ARG_DIMS", "vllm.model_executor.models.transformers.multimodal.MultiModalDummyInputsBuilder", "vllm.model_executor.models.transformers.multimodal.MultiModalMixin", "vllm.model_executor.models.transformers.multimodal.MultiModalProcessingInfo", "vllm.model_executor.models.transformers.multimodal.MultiModalProcessor", "vllm.model_executor.models.transformers.multimodal.logger" ], "n_typable": 41, "n_typed": 30, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 24, "n_classes": 4, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/transformers/pooling.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.transformers.pooling.SequenceClassificationMixin", "methods": [ { "kind": "function", "name": "SequenceClassificationMixin.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SequenceClassificationMixin.default_seq_pooling_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SequenceClassificationMixin.classifier", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SequenceClassificationMixin.pooler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 5, "n_typed": 2, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.transformers.pooling.EmbeddingMixin", "methods": [ { "kind": "function", "name": "EmbeddingMixin.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EmbeddingMixin.default_seq_pooling_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EmbeddingMixin.pooler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 4, "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.transformers.pooling", "names": [ "vllm.model_executor.models.transformers.pooling.EmbeddingMixin", "vllm.model_executor.models.transformers.pooling.SequenceClassificationMixin" ], "n_typable": 9, "n_typed": 4, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_classes": 2, "n_attrs": 5, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/transformers/utils.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.models.transformers.utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.models.transformers.utils.init_on_device_without_buffers", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.models.transformers.utils.replace_linear_class", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.model_executor.models.transformers.utils.get_feature_request_tip", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.model_executor.models.transformers.utils.TorchConv", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.model_executor.models.transformers.utils.can_enable_torch_compile", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.models.transformers.utils.replace_rms_norm_class", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.models.transformers.utils.log_replacement", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.model_executor.models.transformers.utils.VllmConv", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.model_executor.models.transformers.utils.replace_conv_class", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.model_executor.models.transformers.utils.Style", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.models.transformers.utils", "names": [ "vllm.model_executor.models.transformers.utils.Style", "vllm.model_executor.models.transformers.utils.TorchConv", "vllm.model_executor.models.transformers.utils.VllmConv", "vllm.model_executor.models.transformers.utils.can_enable_torch_compile", "vllm.model_executor.models.transformers.utils.get_feature_request_tip", "vllm.model_executor.models.transformers.utils.init_on_device_without_buffers", "vllm.model_executor.models.transformers.utils.log_replacement", "vllm.model_executor.models.transformers.utils.logger", "vllm.model_executor.models.transformers.utils.replace_conv_class", "vllm.model_executor.models.transformers.utils.replace_linear_class", "vllm.model_executor.models.transformers.utils.replace_rms_norm_class" ], "n_typable": 23, "n_typed": 20, "n_any": 0, "n_untyped": 3, "n_functions": 7, "n_function_overloads": 7, "n_function_params": 14, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/ultravox.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.ultravox.ModifiedWhisperEncoder", "methods": [ { "kind": "function", "name": "ModifiedWhisperEncoder.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ModifiedWhisperEncoder.get_attention_mask_by_audio_len", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ModifiedWhisperEncoder.forward", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [ { "kind": "property", "name": "ModifiedWhisperEncoder.max_context_length", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "ModifiedWhisperEncoder.base_model_prefix", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 10, "n_typed": 4, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_attrs": 1, "n_properties": 1 }, { "kind": "class", "name": "vllm.model_executor.models.ultravox.UltravoxProcessingInfo", "methods": [ { "kind": "function", "name": "UltravoxProcessingInfo.get_hf_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "UltravoxProcessingInfo.get_feature_extractor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "UltravoxProcessingInfo.get_default_tok_params", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "UltravoxProcessingInfo.get_data_parser", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "UltravoxProcessingInfo.get_target_channels", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "UltravoxProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 8, "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ultravox.StackAudioFrames", "methods": [ { "kind": "function", "name": "StackAudioFrames.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StackAudioFrames.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "StackAudioFrames.stack_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 5, "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.ultravox.pad_and_concat_to_dim3", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.model_executor.models.ultravox.UltravoxTransformerProjector", "methods": [ { "kind": "function", "name": "UltravoxTransformerProjector.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "UltravoxTransformerProjector.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "UltravoxTransformerProjector.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UltravoxTransformerProjector.ln_pre", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UltravoxTransformerProjector.linear_in", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UltravoxTransformerProjector.embed_positions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UltravoxTransformerProjector.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UltravoxTransformerProjector.ln_post", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UltravoxTransformerProjector.linear_out", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 4, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ultravox.UltravoxDummyInputsBuilder", "methods": [ { "kind": "function", "name": "UltravoxDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "UltravoxDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ultravox.UltravoxAudioEmbeddingInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "UltravoxAudioEmbeddingInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "UltravoxAudioEmbeddingInputs.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.ultravox.UltravoxAudioInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.ultravox.UltravoxMultiModalProcessor", "methods": [ { "kind": "function", "name": "UltravoxMultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "UltravoxMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "UltravoxMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ultravox.UltravoxModel", "methods": [ { "kind": "function", "name": "UltravoxModel.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "UltravoxModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "UltravoxModel.get_mm_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "UltravoxModel._audio_features_to_embeddings", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "UltravoxModel._parse_and_validate_audio_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "UltravoxModel._process_audio_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "UltravoxModel.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "UltravoxModel.embed_input_ids", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "UltravoxModel.forward", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "UltravoxModel.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "UltravoxModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "UltravoxModel.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "UltravoxModel.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UltravoxModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UltravoxModel.multi_modal_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UltravoxModel.secondary_weights", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UltravoxModel.make_empty_intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UltravoxModel.audio_tower", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UltravoxModel.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UltravoxModel.multi_modal_projector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 40, "n_typed": 30, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 21, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ultravox.UltravoxAudioFeatureInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "UltravoxAudioFeatureInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "UltravoxAudioFeatureInputs.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "UltravoxAudioFeatureInputs.lens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "UltravoxAudioFeatureInputs.token_len", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "UltravoxAudioFeatureInputs.num_chunks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.ultravox.UltravoxFeedForwardProjector", "methods": [ { "kind": "function", "name": "UltravoxFeedForwardProjector.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "UltravoxFeedForwardProjector.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "UltravoxFeedForwardProjector.hidden_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UltravoxFeedForwardProjector.ln_pre", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UltravoxFeedForwardProjector.linear_1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UltravoxFeedForwardProjector.linear_2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UltravoxFeedForwardProjector.act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UltravoxFeedForwardProjector.ln_mid", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "UltravoxFeedForwardProjector.ln_post", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 5, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 7, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.ultravox", "names": [ "vllm.model_executor.models.ultravox.ModifiedWhisperEncoder", "vllm.model_executor.models.ultravox.StackAudioFrames", "vllm.model_executor.models.ultravox.UltravoxAudioEmbeddingInputs", "vllm.model_executor.models.ultravox.UltravoxAudioFeatureInputs", "vllm.model_executor.models.ultravox.UltravoxAudioInputs", "vllm.model_executor.models.ultravox.UltravoxDummyInputsBuilder", "vllm.model_executor.models.ultravox.UltravoxFeedForwardProjector", "vllm.model_executor.models.ultravox.UltravoxModel", "vllm.model_executor.models.ultravox.UltravoxMultiModalProcessor", "vllm.model_executor.models.ultravox.UltravoxProcessingInfo", "vllm.model_executor.models.ultravox.UltravoxTransformerProjector", "vllm.model_executor.models.ultravox.pad_and_concat_to_dim3" ], "n_typable": 115, "n_typed": 81, "n_any": 0, "n_untyped": 34, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 31, "n_method_overloads": 31, "n_method_params": 50, "n_classes": 10, "n_attrs": 33, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.models.utils.fast_topk", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.model_executor.models.utils.WeightsMapper", "methods": [ { "kind": "function", "name": "WeightsMapper.__or__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WeightsMapper._map_name", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WeightsMapper.apply", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WeightsMapper.apply_list", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WeightsMapper.apply_dict", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "WeightsMapper.orig_to_new_substr", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "WeightsMapper.orig_to_new_prefix", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "WeightsMapper.orig_to_new_suffix", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 10, "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 5, "n_attrs": 3, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.utils.collect_children", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.models.utils.init_vllm_registered_model", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.model_executor.models.utils.LayerFn", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.utils.isin_list", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.models.utils.sequence_parallel_chunk_impl", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.models.utils.make_empty_intermediate_tensors_factory", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.models.utils.maybe_prefix", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.models.utils.no_init_weights", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.models.utils.split_list_into_ranges", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.models.utils.flatten_bn", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 4, "n_typable": 3, "n_params": 2, "n_function_overloads": 4, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.models.utils.get_pp_missing_layer_names", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.model_executor.models.utils.AutoWeightsLoader", "methods": [ { "kind": "function", "name": "AutoWeightsLoader.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "AutoWeightsLoader._groupby_prefix", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AutoWeightsLoader._get_qualname", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AutoWeightsLoader._can_skip", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AutoWeightsLoader._can_ignore_unexpected", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AutoWeightsLoader._load_param", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "AutoWeightsLoader._add_loadable_non_param_tensors", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AutoWeightsLoader._load_module", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "AutoWeightsLoader.load_weights", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AutoWeightsLoader.ROTARY_EMBEDS_UNUSED_WEIGHTS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AutoWeightsLoader.module", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AutoWeightsLoader.skip_prefixes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AutoWeightsLoader.skip_substrs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AutoWeightsLoader.ignore_unexpected_prefixes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AutoWeightsLoader.ignore_unexpected_suffixes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 34, "n_typed": 28, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 20, "n_attrs": 6, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.utils.cast_overflow_tensors", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.models.utils.get_draft_quant_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.model_executor.models.utils.StageMissingLayer", "methods": [ { "kind": "function", "name": "StageMissingLayer.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StageMissingLayer.__getattr__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StageMissingLayer.__call__", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StageMissingLayer.extra_repr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "StageMissingLayer.stage_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 5, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 5, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.utils.process_eagle_weight", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.models.utils.get_layer_index", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.models.utils.sequence_parallel_chunk_impl_fake", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.model_executor.models.utils.PPMissingLayer", "methods": [ { "kind": "function", "name": "PPMissingLayer.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PPMissingLayer.forward", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 0, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.utils.extract_layer_index", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.models.utils.make_layers", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.models.utils.is_pp_missing_parameter", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.models.utils.sequence_parallel_chunk", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.model_executor.models.utils.WeightsMapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.models.utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.models.utils", "names": [ "vllm.model_executor.models.utils.AutoWeightsLoader", "vllm.model_executor.models.utils.LayerFn", "vllm.model_executor.models.utils.PPMissingLayer", "vllm.model_executor.models.utils.StageMissingLayer", "vllm.model_executor.models.utils.WeightsMapper", "vllm.model_executor.models.utils.WeightsMapping", "vllm.model_executor.models.utils.cast_overflow_tensors", "vllm.model_executor.models.utils.collect_children", "vllm.model_executor.models.utils.extract_layer_index", "vllm.model_executor.models.utils.fast_topk", "vllm.model_executor.models.utils.flatten_bn", "vllm.model_executor.models.utils.get_draft_quant_config", "vllm.model_executor.models.utils.get_layer_index", "vllm.model_executor.models.utils.get_pp_missing_layer_names", "vllm.model_executor.models.utils.init_vllm_registered_model", "vllm.model_executor.models.utils.is_pp_missing_parameter", "vllm.model_executor.models.utils.isin_list", "vllm.model_executor.models.utils.logger", "vllm.model_executor.models.utils.make_empty_intermediate_tensors_factory", "vllm.model_executor.models.utils.make_layers", "vllm.model_executor.models.utils.maybe_prefix", "vllm.model_executor.models.utils.no_init_weights", "vllm.model_executor.models.utils.process_eagle_weight", "vllm.model_executor.models.utils.sequence_parallel_chunk", "vllm.model_executor.models.utils.sequence_parallel_chunk_impl", "vllm.model_executor.models.utils.sequence_parallel_chunk_impl_fake", "vllm.model_executor.models.utils.split_list_into_ranges" ], "n_typable": 122, "n_typed": 101, "n_any": 0, "n_untyped": 21, "n_functions": 20, "n_function_overloads": 23, "n_function_params": 40, "n_methods": 20, "n_method_overloads": 20, "n_method_params": 34, "n_classes": 5, "n_attrs": 12, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/vision.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.vision.VisionEncoderInfo", "methods": [ { "kind": "function", "name": "VisionEncoderInfo.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "VisionEncoderInfo.get_num_image_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VisionEncoderInfo.get_image_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "VisionEncoderInfo.get_patch_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "VisionEncoderInfo.get_patch_grid_length", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "VisionEncoderInfo.hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VisionEncoderInfo.vision_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 8, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 3, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.vision.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.models.vision.VisionFeatureSelectStrategyStr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.models.vision.run_dp_sharded_vision_model", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.models.vision.should_torch_compile_mm_vit", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.models.vision.get_llm_pos_ids_for_vision", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.model_executor.models.vision.resolve_visual_encoder_outputs", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.model_executor.models.vision.get_vit_attn_backend", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.model_executor.models.vision.VisionFeatureSelectStrategy", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.models.vision.get_load_balance_assignment", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.models.vision.is_vit_use_data_parallel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.model_executor.models.vision.get_num_selected_vision_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.models.vision.run_dp_sharded_mrope_vision_model", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.model_executor.models.vision.VisionLanguageConfig", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.vision.get_vision_encoder_info", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.model_executor.models.vision", "names": [ "vllm.model_executor.models.vision.VisionEncoderInfo", "vllm.model_executor.models.vision.VisionFeatureSelectStrategy", "vllm.model_executor.models.vision.VisionFeatureSelectStrategyStr", "vllm.model_executor.models.vision.VisionLanguageConfig", "vllm.model_executor.models.vision.get_llm_pos_ids_for_vision", "vllm.model_executor.models.vision.get_load_balance_assignment", "vllm.model_executor.models.vision.get_num_selected_vision_tokens", "vllm.model_executor.models.vision.get_vision_encoder_info", "vllm.model_executor.models.vision.get_vit_attn_backend", "vllm.model_executor.models.vision.is_vit_use_data_parallel", "vllm.model_executor.models.vision.logger", "vllm.model_executor.models.vision.resolve_visual_encoder_outputs", "vllm.model_executor.models.vision.run_dp_sharded_mrope_vision_model", "vllm.model_executor.models.vision.run_dp_sharded_vision_model", "vllm.model_executor.models.vision.should_torch_compile_mm_vit" ], "n_typable": 49, "n_typed": 45, "n_any": 0, "n_untyped": 4, "n_functions": 10, "n_function_overloads": 10, "n_function_params": 26, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 3, "n_classes": 2, "n_attrs": 5, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/voxtral.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.voxtral.AudioLanguageAdapter", "methods": [ { "kind": "function", "name": "AudioLanguageAdapter.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AudioLanguageAdapter.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AudioLanguageAdapter.w_in", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AudioLanguageAdapter.gelu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AudioLanguageAdapter.w_out", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 5, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.voxtral.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.models.voxtral.ISO639_1_SUPPORTED_LANGS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.model_executor.models.voxtral.VoxtralForConditionalGeneration", "methods": [ { "kind": "function", "name": "VoxtralForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VoxtralForConditionalGeneration.get_mm_mapping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "VoxtralForConditionalGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "VoxtralForConditionalGeneration.embed_multimodal", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "VoxtralForConditionalGeneration._parse_and_validate_audio_arrays", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "VoxtralForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "VoxtralForConditionalGeneration.get_speech_to_text_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VoxtralForConditionalGeneration.get_generation_prompt", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "VoxtralForConditionalGeneration.get_num_audio_tokens", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "VoxtralForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "VoxtralForConditionalGeneration.maybe_update_quant_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "VoxtralForConditionalGeneration.supported_languages", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VoxtralForConditionalGeneration.skip_warmup_audio_preprocessing", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VoxtralForConditionalGeneration.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VoxtralForConditionalGeneration.tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VoxtralForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VoxtralForConditionalGeneration.downsample_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VoxtralForConditionalGeneration.language_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VoxtralForConditionalGeneration.whisper_encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VoxtralForConditionalGeneration.audio_language_adapter", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 41, "n_typed": 33, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 24, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.voxtral.VoxtralMultiModalProcessor", "methods": [ { "kind": "function", "name": "VoxtralMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VoxtralMultiModalProcessor._validate_mm_placeholders", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VoxtralMultiModalProcessor._apply_hf_processor_mm_only", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "VoxtralMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "VoxtralMultiModalProcessor._cached_apply_hf_processor", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 17, "n_typed": 17, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 12, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.voxtral.VoxtralProcessingInfo", "methods": [ { "kind": "function", "name": "VoxtralProcessingInfo.get_tokenizer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "VoxtralProcessingInfo.get_hf_processor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "VoxtralProcessingInfo.get_data_parser", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "VoxtralProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "VoxtralProcessingInfo.get_mm_max_tokens_per_item", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VoxtralProcessingInfo.get_max_audio_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "VoxtralProcessingInfo.get_max_audio_array_len", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.voxtral.VoxtralEncoderModel", "methods": [ { "kind": "function", "name": "VoxtralEncoderModel.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VoxtralEncoderModel.compute_whisper_melspec", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "VoxtralEncoderModel.prepare_inputs_for_conv", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "VoxtralEncoderModel.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "VoxtralEncoderModel.load_weight", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "VoxtralEncoderModel.downsample_factor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "VoxtralEncoderModel.chunk_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "VoxtralEncoderModel.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VoxtralEncoderModel.mistral_remapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VoxtralEncoderModel.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VoxtralEncoderModel.dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VoxtralEncoderModel.is_causal", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VoxtralEncoderModel.whisper_encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VoxtralEncoderModel.mel_filters", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 14, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 6, "n_attrs": 7, "n_properties": 2 }, { "kind": "class", "name": "vllm.model_executor.models.voxtral.VoxtralDummyInputsBuilder", "methods": [ { "kind": "function", "name": "VoxtralDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "VoxtralDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "VoxtralDummyInputsBuilder.get_dummy_processor_inputs", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 10, "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.voxtral.VoxtralProcessorAdapter", "methods": [ { "kind": "function", "name": "VoxtralProcessorAdapter.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "VoxtralProcessorAdapter.get_num_audio_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "VoxtralProcessorAdapter.__call__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [ { "kind": "property", "name": "VoxtralProcessorAdapter._audio_processor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "VoxtralProcessorAdapter.audio_token_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "VoxtralProcessorAdapter.begin_audio_token_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "VoxtralProcessorAdapter.sampling_rate", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "VoxtralProcessorAdapter.frame_rate", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "VoxtralProcessorAdapter.tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 13, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_attrs": 1, "n_properties": 5 } ], "type_ignores": [], "name": "vllm.model_executor.models.voxtral", "names": [ "vllm.model_executor.models.voxtral.AudioLanguageAdapter", "vllm.model_executor.models.voxtral.ISO639_1_SUPPORTED_LANGS", "vllm.model_executor.models.voxtral.VoxtralDummyInputsBuilder", "vllm.model_executor.models.voxtral.VoxtralEncoderModel", "vllm.model_executor.models.voxtral.VoxtralForConditionalGeneration", "vllm.model_executor.models.voxtral.VoxtralMultiModalProcessor", "vllm.model_executor.models.voxtral.VoxtralProcessingInfo", "vllm.model_executor.models.voxtral.VoxtralProcessorAdapter", "vllm.model_executor.models.voxtral.logger" ], "n_typable": 119, "n_typed": 100, "n_any": 0, "n_untyped": 19, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 36, "n_method_overloads": 36, "n_method_params": 60, "n_classes": 7, "n_attrs": 22, "n_properties": 7, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/voxtral_realtime.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.voxtral_realtime.VoxtralRealtimeMultiModalProcessor", "methods": [ { "kind": "function", "name": "VoxtralRealtimeMultiModalProcessor.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "VoxtralRealtimeMultiModalProcessor._maybe_apply_prompt_updates", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [], "n_typable": 10, "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.voxtral_realtime.VoxtralRealtimeGeneration", "methods": [ { "kind": "function", "name": "VoxtralRealtimeGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VoxtralRealtimeGeneration.buffer_realtime_audio", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "VoxtralRealtimeGeneration.embed_input_ids", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "VoxtralRealtimeGeneration.forward", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "VoxtralRealtimeGeneration.embed_multimodal", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "VoxtralRealtimeGeneration.get_speech_to_text_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VoxtralRealtimeGeneration.get_generation_prompt", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [ { "kind": "property", "name": "VoxtralRealtimeGeneration.audio_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "VoxtralRealtimeGeneration.requires_raw_input_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VoxtralRealtimeGeneration.skip_warmup_audio_preprocessing", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VoxtralRealtimeGeneration.time_embedding", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VoxtralRealtimeGeneration.n_delay_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 34, "n_typed": 30, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 24, "n_attrs": 4, "n_properties": 1 }, { "kind": "class", "name": "vllm.model_executor.models.voxtral_realtime.VoxtralRealtimeBuffer", "methods": [ { "kind": "function", "name": "VoxtralRealtimeBuffer.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VoxtralRealtimeBuffer._generate_frame_size_and_num_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "VoxtralRealtimeBuffer._ms_to_samples", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "VoxtralRealtimeBuffer.append_audio", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "VoxtralRealtimeBuffer.append_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "VoxtralRealtimeBuffer.get_input_stream", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 11, "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.voxtral_realtime.TimeEmbedding", "methods": [ { "kind": "function", "name": "TimeEmbedding.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TimeEmbedding.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TimeEmbedding.dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TimeEmbedding.theta", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.voxtral_realtime.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.models.voxtral_realtime", "names": [ "vllm.model_executor.models.voxtral_realtime.TimeEmbedding", "vllm.model_executor.models.voxtral_realtime.VoxtralRealtimeBuffer", "vllm.model_executor.models.voxtral_realtime.VoxtralRealtimeGeneration", "vllm.model_executor.models.voxtral_realtime.VoxtralRealtimeMultiModalProcessor", "vllm.model_executor.models.voxtral_realtime.logger" ], "n_typable": 63, "n_typed": 56, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 17, "n_method_overloads": 17, "n_method_params": 40, "n_classes": 4, "n_attrs": 7, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/voyage.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.voyage.VoyageQwen3BidirectionalEmbedModel", "methods": [ { "kind": "function", "name": "VoyageQwen3BidirectionalEmbedModel.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VoyageQwen3BidirectionalEmbedModel.forward", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VoyageQwen3BidirectionalEmbedModel._fuse_qkv_proj", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "VoyageQwen3BidirectionalEmbedModel._fuse_gate_up_proj", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "VoyageQwen3BidirectionalEmbedModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "VoyageQwen3BidirectionalEmbedModel.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VoyageQwen3BidirectionalEmbedModel.linear", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 6, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 7, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.voyage.WeightItem", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.voyage", "names": [ "vllm.model_executor.models.voyage.VoyageQwen3BidirectionalEmbedModel", "vllm.model_executor.models.voyage.WeightItem" ], "n_typable": 14, "n_typed": 6, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 7, "n_classes": 1, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/whisper.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.models.whisper.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.whisper.WhisperPositionalEmbedding", "methods": [ { "kind": "function", "name": "WhisperPositionalEmbedding.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "WhisperPositionalEmbedding.forward", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 5, "n_typed": 2, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.whisper.WhisperForConditionalGeneration", "methods": [ { "kind": "function", "name": "WhisperForConditionalGeneration.validate_language", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WhisperForConditionalGeneration.get_generation_prompt", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "WhisperForConditionalGeneration.get_language_token_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WhisperForConditionalGeneration.get_language_detection_prompt", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "WhisperForConditionalGeneration.parse_language_detection_output", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "WhisperForConditionalGeneration.get_placeholder_str", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "WhisperForConditionalGeneration.get_speech_to_text_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "WhisperForConditionalGeneration.get_num_audio_tokens", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "WhisperForConditionalGeneration.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "WhisperForConditionalGeneration.forward", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "WhisperForConditionalGeneration.embed_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WhisperForConditionalGeneration.embed_input_ids", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "WhisperForConditionalGeneration._parse_and_validate_audio_input", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WhisperForConditionalGeneration.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WhisperForConditionalGeneration.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "WhisperForConditionalGeneration.packed_modules_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "WhisperForConditionalGeneration.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperForConditionalGeneration.supports_transcription_only", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "WhisperForConditionalGeneration.supports_segment_timestamp", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "WhisperForConditionalGeneration.supports_explicit_language_detection", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "WhisperForConditionalGeneration.supported_languages", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "WhisperForConditionalGeneration.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperForConditionalGeneration.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperForConditionalGeneration.proj_out", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperForConditionalGeneration.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperForConditionalGeneration.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 55, "n_typed": 47, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 34, "n_attrs": 11, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.whisper.WhisperEncoder", "methods": [ { "kind": "function", "name": "WhisperEncoder.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "WhisperEncoder.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "WhisperEncoder.pos_embed_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperEncoder.num_mel_bins", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperEncoder.max_source_positions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperEncoder.embed_scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperEncoder.conv1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperEncoder.conv2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperEncoder.total_stride", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperEncoder.layer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperEncoder.embed_positions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 5, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.whisper.WhisperMultiModalProcessor", "methods": [ { "kind": "function", "name": "WhisperMultiModalProcessor.create_encoder_prompt", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "WhisperMultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "WhisperMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "WhisperMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 15, "n_typed": 15, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 11, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.whisper.WhisperMLP", "methods": [ { "kind": "function", "name": "WhisperMLP.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "WhisperMLP.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "WhisperMLP.activation_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperMLP.fc1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperMLP.fc2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 6, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.whisper.WhisperEncoderAttention", "methods": [ { "kind": "function", "name": "WhisperEncoderAttention.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.whisper.WhisperProcessingInfo", "methods": [ { "kind": "function", "name": "WhisperProcessingInfo.get_hf_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "WhisperProcessingInfo.get_default_tok_params", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "WhisperProcessingInfo.get_data_parser", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "WhisperProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "WhisperProcessingInfo.get_feature_extractor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WhisperProcessingInfo.get_target_channels", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "WhisperProcessingInfo.get_num_audio_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "WhisperProcessingInfo.skip_prompt_length_check", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [], "n_typable": 9, "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 1, "n_attrs": 0, "n_properties": 1 }, { "kind": "class", "name": "vllm.model_executor.models.whisper.WhisperDecoder", "methods": [ { "kind": "function", "name": "WhisperDecoder.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "WhisperDecoder.forward", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "WhisperDecoder.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "WhisperDecoder.layerdrop", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperDecoder.padding_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperDecoder.max_target_positions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperDecoder.max_source_positions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperDecoder.embed_scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperDecoder.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperDecoder.embed_positions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperDecoder.layer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 6, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.whisper.WhisperEncoderLayer", "methods": [ { "kind": "function", "name": "WhisperEncoderLayer.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "WhisperEncoderLayer.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "WhisperEncoderLayer.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperEncoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperEncoderLayer.self_attn_layer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperEncoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperEncoderLayer.final_layer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 3, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.whisper.WhisperAttention", "methods": [ { "kind": "function", "name": "WhisperAttention.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "WhisperAttention._init_qkv", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "WhisperAttention.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "WhisperAttention.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperAttention.attn_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperAttention.out_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 27, "n_typed": 14, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 13, "n_attrs": 11, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.whisper.WhisperCrossAttention", "methods": [ { "kind": "function", "name": "WhisperCrossAttention.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "WhisperCrossAttention._init_qkv", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "WhisperCrossAttention.forward", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 15, "n_typed": 13, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 12, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.whisper.WhisperDecoderLayer", "methods": [ { "kind": "function", "name": "WhisperDecoderLayer.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "WhisperDecoderLayer.forward", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "WhisperDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperDecoderLayer.self_attn_layer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperDecoderLayer.encoder_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperDecoderLayer.encoder_attn_layer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperDecoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperDecoderLayer.final_layer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 4, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.whisper.WhisperModel", "methods": [ { "kind": "function", "name": "WhisperModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "WhisperModel.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "WhisperModel.get_encoder_outputs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WhisperModel.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "WhisperModel.encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperModel.decoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 10, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 7, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.whisper.WhisperPosEmbedType", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "WhisperPosEmbedType.SINUSOIDAL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "WhisperPosEmbedType.ROPE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "WhisperPosEmbedType.LEARNED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.whisper.WhisperAudioInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "WhisperAudioInputs.input_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.whisper.WhisperDummyInputsBuilder", "methods": [ { "kind": "function", "name": "WhisperDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WhisperDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.whisper", "names": [ "vllm.model_executor.models.whisper.WhisperAttention", "vllm.model_executor.models.whisper.WhisperAudioInputs", "vllm.model_executor.models.whisper.WhisperCrossAttention", "vllm.model_executor.models.whisper.WhisperDecoder", "vllm.model_executor.models.whisper.WhisperDecoderLayer", "vllm.model_executor.models.whisper.WhisperDummyInputsBuilder", "vllm.model_executor.models.whisper.WhisperEncoder", "vllm.model_executor.models.whisper.WhisperEncoderAttention", "vllm.model_executor.models.whisper.WhisperEncoderLayer", "vllm.model_executor.models.whisper.WhisperForConditionalGeneration", "vllm.model_executor.models.whisper.WhisperMLP", "vllm.model_executor.models.whisper.WhisperModel", "vllm.model_executor.models.whisper.WhisperMultiModalProcessor", "vllm.model_executor.models.whisper.WhisperPosEmbedType", "vllm.model_executor.models.whisper.WhisperPositionalEmbedding", "vllm.model_executor.models.whisper.WhisperProcessingInfo", "vllm.model_executor.models.whisper.logger" ], "n_typable": 216, "n_typed": 144, "n_any": 0, "n_untyped": 72, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 52, "n_method_overloads": 52, "n_method_params": 111, "n_classes": 16, "n_attrs": 60, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/whisper_causal.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.models.whisper_causal.CausalRMSNorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.models.whisper_causal.WhisperCausalAttention", "methods": [ { "kind": "function", "name": "WhisperCausalAttention.__init__", "n_typed": 11, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "WhisperCausalAttention._init_rotary_emb", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WhisperCausalAttention._init_qkv", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "WhisperCausalAttention.forward", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "WhisperCausalAttention.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperCausalAttention.total_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperCausalAttention.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperCausalAttention.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperCausalAttention.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperCausalAttention.q_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperCausalAttention.kv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperCausalAttention.attn_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperCausalAttention.scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperCausalAttention.out_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperCausalAttention.attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 33, "n_typed": 20, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 18, "n_attrs": 11, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.whisper_causal.WhisperCausalEncoderLayer", "methods": [ { "kind": "function", "name": "WhisperCausalEncoderLayer.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "WhisperCausalEncoderLayer.forward", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "WhisperCausalEncoderLayer.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperCausalEncoderLayer.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperCausalEncoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperCausalEncoderLayer.self_attn_layer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperCausalEncoderLayer.mlp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperCausalEncoderLayer.final_layer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 4, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.whisper_causal.WhisperCausalAttentionWithBlockPooling", "methods": [ { "kind": "function", "name": "WhisperCausalAttentionWithBlockPooling.__init__", "n_typed": 15, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 }, { "kind": "function", "name": "WhisperCausalAttentionWithBlockPooling.get_kv_cache_spec", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "WhisperCausalAttentionWithBlockPooling.block_pool_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 16, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 16, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.whisper_causal.WhisperCausalConv1d", "methods": [ { "kind": "function", "name": "WhisperCausalConv1d.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "WhisperCausalConv1d.forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.models.whisper_causal.create_whisper_attention_backend_with_block_pooling", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.model_executor.models.whisper_causal.WhisperCausalEncoder", "methods": [ { "kind": "function", "name": "WhisperCausalEncoder.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "WhisperCausalEncoder.forward_conv", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WhisperCausalEncoder.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "WhisperCausalEncoder.num_mel_bins", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperCausalEncoder.max_source_positions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperCausalEncoder.embed_scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperCausalEncoder.conv1", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperCausalEncoder.conv2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperCausalEncoder.total_stride", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WhisperCausalEncoder.layer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 7, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 5, "n_attrs": 7, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.models.whisper_causal.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.models.whisper_causal.AiterFlashAttentionBackend", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.whisper_causal", "names": [ "vllm.model_executor.models.whisper_causal.AiterFlashAttentionBackend", "vllm.model_executor.models.whisper_causal.CausalRMSNorm", "vllm.model_executor.models.whisper_causal.WhisperCausalAttention", "vllm.model_executor.models.whisper_causal.WhisperCausalAttentionWithBlockPooling", "vllm.model_executor.models.whisper_causal.WhisperCausalConv1d", "vllm.model_executor.models.whisper_causal.WhisperCausalEncoder", "vllm.model_executor.models.whisper_causal.WhisperCausalEncoderLayer", "vllm.model_executor.models.whisper_causal.create_whisper_attention_backend_with_block_pooling", "vllm.model_executor.models.whisper_causal.logger" ], "n_typable": 93, "n_typed": 59, "n_any": 0, "n_untyped": 34, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 50, "n_classes": 5, "n_attrs": 28, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/whisper_utils.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.models.whisper_utils.ISO639_1_SUPPORTED_LANGS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.whisper_utils", "names": [ "vllm.model_executor.models.whisper_utils.ISO639_1_SUPPORTED_LANGS" ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/models/zamba2.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.models.zamba2.Zamba2MambaDecoderLayer", "methods": [ { "kind": "function", "name": "Zamba2MambaDecoderLayer.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Zamba2MambaDecoderLayer.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Zamba2MambaDecoderLayer.mamba", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2MambaDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 11, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 9, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.zamba2.Zamba2LoRA", "methods": [ { "kind": "function", "name": "Zamba2LoRA.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Zamba2LoRA.forward", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Zamba2LoRA.A", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2LoRA.B", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 6, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.zamba2.Zamba2HybridLayer", "methods": [ { "kind": "function", "name": "Zamba2HybridLayer.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "Zamba2HybridLayer.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Zamba2HybridLayer.block_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2HybridLayer.shared_transformer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2HybridLayer.linear", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2HybridLayer.mamba_decoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 12, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 10, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.zamba2.Zamba2AttentionDecoderLayer", "methods": [ { "kind": "function", "name": "Zamba2AttentionDecoderLayer.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Zamba2AttentionDecoderLayer.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Zamba2AttentionDecoderLayer.self_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2AttentionDecoderLayer.feed_forward", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2AttentionDecoderLayer.input_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2AttentionDecoderLayer.pre_ff_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 12, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 10, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.zamba2.Zamba2Attention", "methods": [ { "kind": "function", "name": "Zamba2Attention.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Zamba2Attention.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Zamba2Attention.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2Attention.num_hybrid_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2Attention.attention_hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2Attention.total_num_attention_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2Attention.num_attention_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2Attention.attention_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2Attention.qkv_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2Attention.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2Attention.qkv_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2Attention.o_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2Attention.dpa_list", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2Attention.linear_q_adapter_list", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2Attention.linear_k_adapter_list", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2Attention.linear_v_adapter_list", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2Attention.rotary_emb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 26, "n_typed": 11, "n_any": 0, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 9, "n_attrs": 15, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.zamba2.Zamba2Model", "methods": [ { "kind": "function", "name": "Zamba2Model.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Zamba2Model.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Zamba2Model.forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Zamba2Model.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Zamba2Model.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2Model.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2Model.embed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2Model.layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2Model.final_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 11, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 7, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.zamba2.Zamba2ForCausalLM", "methods": [ { "kind": "function", "name": "Zamba2ForCausalLM.get_mamba_state_dtype_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Zamba2ForCausalLM.get_mamba_state_shape_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Zamba2ForCausalLM.get_mamba_state_copy_func", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Zamba2ForCausalLM.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Zamba2ForCausalLM.embed_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Zamba2ForCausalLM.forward", "n_typed": 4, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Zamba2ForCausalLM.compute_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Zamba2ForCausalLM.load_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Zamba2ForCausalLM.hf_to_vllm_mapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2ForCausalLM.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2ForCausalLM.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2ForCausalLM.scheduler_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2ForCausalLM.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2ForCausalLM.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2ForCausalLM.lm_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2ForCausalLM.logits_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 27, "n_typed": 18, "n_any": 1, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 11, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.models.zamba2.Zamba2MLP", "methods": [ { "kind": "function", "name": "Zamba2MLP.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Zamba2MLP.forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Zamba2MLP.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2MLP.tp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2MLP.num_hybrid_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2MLP.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2MLP.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2MLP.gate_up_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2MLP.down_proj", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2MLP.act_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Zamba2MLP.gate_up_proj_adapter_list", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 9, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 9, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.model_executor.models.zamba2", "names": [ "vllm.model_executor.models.zamba2.Zamba2Attention", "vllm.model_executor.models.zamba2.Zamba2AttentionDecoderLayer", "vllm.model_executor.models.zamba2.Zamba2ForCausalLM", "vllm.model_executor.models.zamba2.Zamba2HybridLayer", "vllm.model_executor.models.zamba2.Zamba2LoRA", "vllm.model_executor.models.zamba2.Zamba2MLP", "vllm.model_executor.models.zamba2.Zamba2MambaDecoderLayer", "vllm.model_executor.models.zamba2.Zamba2Model" ], "n_typable": 142, "n_typed": 90, "n_any": 1, "n_untyped": 51, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 24, "n_method_overloads": 24, "n_method_params": 69, "n_classes": 8, "n_attrs": 49, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/offloader/uva.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.offloader.uva.UVAOffloader", "methods": [ { "kind": "function", "name": "UVAOffloader.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "UVAOffloader.wrap_modules", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "UVAOffloader._maybe_offload_to_cpu", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "UVAOffloader.cpu_offload_max_bytes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UVAOffloader.cpu_offload_bytes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UVAOffloader.cpu_offload_params", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UVAOffloader.pin_memory", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UVAOffloader.uva_offloading", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 6, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_attrs": 5, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.offloader.uva.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.offloader.uva", "names": [ "vllm.model_executor.offloader.uva.UVAOffloader", "vllm.model_executor.offloader.uva.logger" ], "n_typable": 13, "n_typed": 6, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_classes": 1, "n_attrs": 6, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/offloader/base.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.offloader.base.NoopOffloader", "methods": [ { "kind": "function", "name": "NoopOffloader.wrap_modules", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.offloader.base.create_offloader", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.model_executor.offloader.base.BaseOffloader", "methods": [ { "kind": "function", "name": "BaseOffloader.wrap_modules", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseOffloader.post_init", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BaseOffloader.sync_prev_onload", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BaseOffloader.join_after_forward", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BaseOffloader._wait_for_layer", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseOffloader._start_prefetch", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.model_executor.offloader.base.get_offloader", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.model_executor.offloader.base.set_offloader", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.model_executor.offloader.base.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.model_executor.offloader.base", "names": [ "vllm.model_executor.offloader.base.BaseOffloader", "vllm.model_executor.offloader.base.NoopOffloader", "vllm.model_executor.offloader.base.create_offloader", "vllm.model_executor.offloader.base.get_offloader", "vllm.model_executor.offloader.base.logger", "vllm.model_executor.offloader.base.set_offloader" ], "n_typable": 17, "n_typed": 15, "n_any": 0, "n_untyped": 2, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 2, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 4, "n_classes": 2, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/offloader/prefetch.py", "symbol_reports": [ { "kind": "class", "name": "vllm.model_executor.offloader.prefetch.PrefetchOffloader", "methods": [ { "kind": "function", "name": "PrefetchOffloader.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "PrefetchOffloader.wrap_modules", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PrefetchOffloader._hook_module_forward", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PrefetchOffloader._wait_for_layer", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PrefetchOffloader.sync_prev_onload", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PrefetchOffloader._start_prefetch", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PrefetchOffloader.join_after_forward", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PrefetchOffloader.post_init", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PrefetchOffloader.group_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrefetchOffloader.num_in_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrefetchOffloader.prefetch_step", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrefetchOffloader.offload_params", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrefetchOffloader.mode", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrefetchOffloader.copy_stream", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrefetchOffloader.module_offloaders", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PrefetchOffloader.buffer_pool", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PrefetchOffloader.total_offloaded_bytes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 27, "n_typed": 13, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 10, "n_attrs": 9, "n_properties": 0 }, { "kind": "attr", "name": "vllm.model_executor.offloader.prefetch.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.model_executor.offloader.prefetch.StaticBufferPool", "methods": [ { "kind": "function", "name": "StaticBufferPool.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "StaticBufferPool.get_buffer", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "StaticBufferPool.slot_capacity", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StaticBufferPool.total_bytes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 9, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.model_executor.offloader.prefetch.ParamInfo", "methods": [], "properties": [ { "kind": "property", "name": "ParamInfo.key", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ParamInfo.num_bytes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "ParamInfo.name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ParamInfo.shape", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ParamInfo.stride", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ParamInfo.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 2 } ], "type_ignores": [], "name": "vllm.model_executor.offloader.prefetch", "names": [ "vllm.model_executor.offloader.prefetch.ParamInfo", "vllm.model_executor.offloader.prefetch.PrefetchOffloader", "vllm.model_executor.offloader.prefetch.StaticBufferPool", "vllm.model_executor.offloader.prefetch.logger" ], "n_typable": 42, "n_typed": 24, "n_any": 0, "n_untyped": 18, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 18, "n_classes": 3, "n_attrs": 16, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/model_executor/offloader/prefetch_ops.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.offloader.prefetch_ops.register_prefetch_offloader_ops", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "type_ignores": [], "name": "vllm.model_executor.offloader.prefetch_ops", "names": [ "vllm.model_executor.offloader.prefetch_ops.register_prefetch_offloader_ops" ], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.utils.set_weight_attrs", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.model_executor.utils.maybe_disable_graph_partition", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.utils.replace_parameter", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.utils.get_moe_expert_mapping", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.model_executor.utils.get_packed_modules_mapping", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.model_executor.utils", "names": [ "vllm.model_executor.utils.get_moe_expert_mapping", "vllm.model_executor.utils.get_packed_modules_mapping", "vllm.model_executor.utils.maybe_disable_graph_partition", "vllm.model_executor.utils.replace_parameter", "vllm.model_executor.utils.set_weight_attrs" ], "n_typable": 13, "n_typed": 11, "n_any": 0, "n_untyped": 2, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 8, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/warmup/deep_gemm_warmup.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.model_executor.warmup.deep_gemm_warmup.FP8_GEMM_NT_WARMUP_CACHE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.model_executor.warmup.deep_gemm_warmup.GROUPED_FP8_GEMM_NT_CONTIGUOUS_WARMUP_CACHE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.warmup.deep_gemm_warmup.deepgemm_grouped_fp8_gemm_nt_contiguous_warmup", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.warmup.deep_gemm_warmup.deepgemm_fp8_gemm_nt_warmup", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.model_executor.warmup.deep_gemm_warmup.deep_gemm_warmup", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.model_executor.warmup.deep_gemm_warmup", "names": [ "vllm.model_executor.warmup.deep_gemm_warmup.FP8_GEMM_NT_WARMUP_CACHE", "vllm.model_executor.warmup.deep_gemm_warmup.GROUPED_FP8_GEMM_NT_CONTIGUOUS_WARMUP_CACHE", "vllm.model_executor.warmup.deep_gemm_warmup.deep_gemm_warmup", "vllm.model_executor.warmup.deep_gemm_warmup.deepgemm_fp8_gemm_nt_warmup", "vllm.model_executor.warmup.deep_gemm_warmup.deepgemm_grouped_fp8_gemm_nt_contiguous_warmup" ], "n_typable": 13, "n_typed": 10, "n_any": 0, "n_untyped": 3, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 8, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_executor/warmup/kernel_warmup.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_executor.warmup.kernel_warmup.kernel_warmup", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.model_executor.warmup.kernel_warmup.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.model_executor.warmup.kernel_warmup.flashinfer_autotune", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.model_executor.warmup.kernel_warmup", "names": [ "vllm.model_executor.warmup.kernel_warmup.flashinfer_autotune", "vllm.model_executor.warmup.kernel_warmup.kernel_warmup", "vllm.model_executor.warmup.kernel_warmup.logger" ], "n_typable": 5, "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 2, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/model_inspection.py", "symbol_reports": [ { "kind": "function", "name": "vllm.model_inspection.format_model_inspection", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.model_inspection", "names": [ "vllm.model_inspection.format_model_inspection" ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/multimodal/inputs.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.multimodal.inputs.MultiModalUUIDDict", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.multimodal.inputs.ModalityData", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.multimodal.inputs.NestedTensors", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.multimodal.inputs.MultiModalKwargsItems", "methods": [ { "kind": "function", "name": "MultiModalKwargsItems.from_hf_inputs", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MultiModalKwargsItems.__getitem__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiModalKwargsItems.require_data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MultiModalKwargsItems.get_data", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.multimodal.inputs.BatchedTensorInputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.multimodal.inputs.MultiModalDataBuiltins", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "MultiModalDataBuiltins.image", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MultiModalDataBuiltins.video", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MultiModalDataBuiltins.audio", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MultiModalDataBuiltins.vision_chunk", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "attr", "name": "vllm.multimodal.inputs.MultiModalPlaceholderDict", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.multimodal.inputs.MultiModalDataDict", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.multimodal.inputs.batched_tensors_equal", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.multimodal.inputs.MultiModalFlatField", "methods": [ { "kind": "function", "name": "MultiModalFlatField.build_elems", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MultiModalFlatField._reduce_data", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MultiModalFlatField.slices", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MultiModalFlatField.dim", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.multimodal.inputs.VideoItem", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.multimodal.inputs.mm_enc_dec_inputs", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.multimodal.inputs.MultiModalEncDecInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "MultiModalEncDecInputs.encoder_prompt_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MultiModalEncDecInputs.encoder_prompt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.multimodal.inputs.ImageItem", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.multimodal.inputs.nested_tensors_equal", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.multimodal.inputs.MultiModalBatchedField", "methods": [ { "kind": "function", "name": "MultiModalBatchedField.build_elems", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MultiModalBatchedField._reduce_data", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.multimodal.inputs.MultiModalKwargsOptionalItems", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.multimodal.inputs.HfVideoItem", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.multimodal.inputs.MultiModalHashes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.multimodal.inputs.BaseMultiModalField", "methods": [ { "kind": "function", "name": "BaseMultiModalField._field_factory", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BaseMultiModalField.build_elems", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BaseMultiModalField._reduce_data", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseMultiModalField.reduce_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BaseMultiModalField.keep_on_cpu", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 12, "n_typed": 11, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.multimodal.inputs.HfAudioItem", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.multimodal.inputs.torch", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.multimodal.inputs.HfImageItem", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.multimodal.inputs.VisionChunkVideo", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "VisionChunkVideo.type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VisionChunkVideo.video_chunk", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VisionChunkVideo.uuid", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VisionChunkVideo.prompt", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VisionChunkVideo.video_idx", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.multimodal.inputs.MultiModalInputs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "MultiModalInputs.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MultiModalInputs.prompt_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MultiModalInputs.prompt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MultiModalInputs.mm_kwargs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MultiModalInputs.mm_hashes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MultiModalInputs.mm_placeholders", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 6, "n_properties": 0 }, { "kind": "attr", "name": "vllm.multimodal.inputs.AudioItem", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.multimodal.inputs.MultiModalSharedField", "methods": [ { "kind": "function", "name": "MultiModalSharedField.build_elems", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MultiModalSharedField._reduce_data", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MultiModalSharedField.batch_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.multimodal.inputs.MultiModalFieldElem", "methods": [ { "kind": "function", "name": "MultiModalFieldElem.__eq__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MultiModalFieldElem.data", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MultiModalFieldElem.field", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.multimodal.inputs.PlaceholderRange", "methods": [ { "kind": "function", "name": "PlaceholderRange.get_num_embeds", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PlaceholderRange.get_embeds_indices_in_range", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PlaceholderRange.extract_embeds_range", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PlaceholderRange.__eq__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "PlaceholderRange.embeds_cumsum", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "PlaceholderRange.offset", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PlaceholderRange.length", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PlaceholderRange.is_embed", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 8, "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 3, "n_attrs": 3, "n_properties": 1 }, { "kind": "class", "name": "vllm.multimodal.inputs.VisionChunkImage", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "VisionChunkImage.type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VisionChunkImage.image", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "VisionChunkImage.uuid", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.multimodal.inputs.VisionChunk", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.multimodal.inputs.MultiModalFeatureSpec", "methods": [ { "kind": "function", "name": "MultiModalFeatureSpec.gather_kwargs", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MultiModalFeatureSpec.data", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MultiModalFeatureSpec.modality", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MultiModalFeatureSpec.identifier", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MultiModalFeatureSpec.mm_position", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MultiModalFeatureSpec.mm_hash", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.multimodal.inputs.MultiModalFieldConfig", "methods": [ { "kind": "function", "name": "MultiModalFieldConfig.batched", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MultiModalFieldConfig.flat", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MultiModalFieldConfig.flat_from_sizes", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MultiModalFieldConfig.shared", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MultiModalFieldConfig.build_elems", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MultiModalFieldConfig.field", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MultiModalFieldConfig.modality", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 20, "n_typed": 16, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 15, "n_attrs": 2, "n_properties": 0 }, { "kind": "function", "name": "vllm.multimodal.inputs.mm_inputs", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "class", "name": "vllm.multimodal.inputs.MultiModalKwargsItem", "methods": [ { "kind": "function", "name": "MultiModalKwargsItem.dummy", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiModalKwargsItem.get_data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.multimodal.inputs", "names": [ "vllm.multimodal.inputs.AudioItem", "vllm.multimodal.inputs.BaseMultiModalField", "vllm.multimodal.inputs.BatchedTensorInputs", "vllm.multimodal.inputs.HfAudioItem", "vllm.multimodal.inputs.HfImageItem", "vllm.multimodal.inputs.HfVideoItem", "vllm.multimodal.inputs.ImageItem", "vllm.multimodal.inputs.ModalityData", "vllm.multimodal.inputs.MultiModalBatchedField", "vllm.multimodal.inputs.MultiModalDataBuiltins", "vllm.multimodal.inputs.MultiModalDataDict", "vllm.multimodal.inputs.MultiModalEncDecInputs", "vllm.multimodal.inputs.MultiModalFeatureSpec", "vllm.multimodal.inputs.MultiModalFieldConfig", "vllm.multimodal.inputs.MultiModalFieldElem", "vllm.multimodal.inputs.MultiModalFlatField", "vllm.multimodal.inputs.MultiModalHashes", "vllm.multimodal.inputs.MultiModalInputs", "vllm.multimodal.inputs.MultiModalKwargsItem", "vllm.multimodal.inputs.MultiModalKwargsItems", "vllm.multimodal.inputs.MultiModalKwargsOptionalItems", "vllm.multimodal.inputs.MultiModalPlaceholderDict", "vllm.multimodal.inputs.MultiModalSharedField", "vllm.multimodal.inputs.MultiModalUUIDDict", "vllm.multimodal.inputs.NestedTensors", "vllm.multimodal.inputs.PlaceholderRange", "vllm.multimodal.inputs.VideoItem", "vllm.multimodal.inputs.VisionChunk", "vllm.multimodal.inputs.VisionChunkImage", "vllm.multimodal.inputs.VisionChunkVideo", "vllm.multimodal.inputs.batched_tensors_equal", "vllm.multimodal.inputs.mm_enc_dec_inputs", "vllm.multimodal.inputs.mm_inputs", "vllm.multimodal.inputs.nested_tensors_equal", "vllm.multimodal.inputs.torch" ], "n_typable": 117, "n_typed": 108, "n_any": 0, "n_untyped": 9, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 13, "n_methods": 27, "n_method_overloads": 27, "n_method_params": 50, "n_classes": 15, "n_attrs": 52, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/multimodal/__init__.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.multimodal.MULTIMODAL_REGISTRY", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.multimodal", "names": [ "vllm.multimodal.MULTIMODAL_REGISTRY" ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/multimodal/registry.py", "symbol_reports": [ { "kind": "class", "name": "vllm.multimodal.registry.MultiModalRegistry", "methods": [ { "kind": "function", "name": "MultiModalRegistry.supports_multimodal_inputs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiModalRegistry.register_processor", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MultiModalRegistry._get_model_cls", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiModalRegistry._create_processing_ctx", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MultiModalRegistry._create_processing_info", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MultiModalRegistry.create_processor", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MultiModalRegistry.get_dummy_mm_inputs", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MultiModalRegistry._get_cache_type", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiModalRegistry.processor_cache_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiModalRegistry.processor_only_cache_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiModalRegistry.engine_receiver_cache_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiModalRegistry.worker_receiver_cache_from_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 34, "n_typed": 33, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 22, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.multimodal.registry.MultiModalProcessorFactory", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.multimodal.registry.ProcessingInfoFactory", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.multimodal.registry.DummyInputsBuilderFactory", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.multimodal.registry.MultiModalTimingRegistry", "methods": [ { "kind": "function", "name": "MultiModalTimingRegistry.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiModalTimingRegistry.get", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiModalTimingRegistry.stat", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.multimodal.registry.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.multimodal.registry.N", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [ { "kind": "type", "rules": [ "misc" ] }, { "kind": "type", "rules": [ "misc" ] } ], "name": "vllm.multimodal.registry", "names": [ "vllm.multimodal.registry.DummyInputsBuilderFactory", "vllm.multimodal.registry.MultiModalProcessorFactory", "vllm.multimodal.registry.MultiModalRegistry", "vllm.multimodal.registry.MultiModalTimingRegistry", "vllm.multimodal.registry.N", "vllm.multimodal.registry.ProcessingInfoFactory", "vllm.multimodal.registry.logger" ], "n_typable": 40, "n_typed": 38, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 24, "n_classes": 5, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 2 }, { "path": "vllm/multimodal/hasher.py", "symbol_reports": [ { "kind": "class", "name": "vllm.multimodal.hasher.MultiModalHasher", "methods": [ { "kind": "function", "name": "MultiModalHasher.serialize_item", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiModalHasher.iter_item_to_bytes", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MultiModalHasher.hash_kwargs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.multimodal.hasher.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.multimodal.hasher", "names": [ "vllm.multimodal.hasher.MultiModalHasher", "vllm.multimodal.hasher.logger" ], "n_typable": 8, "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/multimodal/audio.py", "symbol_reports": [ { "kind": "class", "name": "vllm.multimodal.audio.AudioSpec", "methods": [ { "kind": "function", "name": "AudioSpec.__repr__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "AudioSpec.needs_normalization", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "AudioSpec.target_channels", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AudioSpec.channel_reduction", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 2, "n_properties": 1 }, { "kind": "attr", "name": "vllm.multimodal.audio.MONO_AUDIO_SPEC", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.multimodal.audio.split_audio", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.multimodal.audio.resample_audio_librosa", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.multimodal.audio.normalize_audio", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.multimodal.audio.AudioResampler", "methods": [ { "kind": "function", "name": "AudioResampler.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AudioResampler.resample", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AudioResampler.target_sr", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AudioResampler.method", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 5, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.multimodal.audio.scipy_signal", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.multimodal.audio.PASSTHROUGH_AUDIO_SPEC", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.multimodal.audio.find_split_point", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.multimodal.audio.resample_audio_scipy", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.multimodal.audio.ChannelReduction", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ChannelReduction.MEAN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ChannelReduction.FIRST", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ChannelReduction.MAX", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ChannelReduction.SUM", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "attr", "name": "vllm.multimodal.audio.librosa", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [ { "kind": "type", "rules": [ "assignment" ] }, { "kind": "type", "rules": [ "assignment" ] } ], "name": "vllm.multimodal.audio", "names": [ "vllm.multimodal.audio.AudioResampler", "vllm.multimodal.audio.AudioSpec", "vllm.multimodal.audio.ChannelReduction", "vllm.multimodal.audio.MONO_AUDIO_SPEC", "vllm.multimodal.audio.PASSTHROUGH_AUDIO_SPEC", "vllm.multimodal.audio.find_split_point", "vllm.multimodal.audio.librosa", "vllm.multimodal.audio.normalize_audio", "vllm.multimodal.audio.resample_audio_librosa", "vllm.multimodal.audio.resample_audio_scipy", "vllm.multimodal.audio.scipy_signal", "vllm.multimodal.audio.split_audio" ], "n_typable": 36, "n_typed": 28, "n_any": 0, "n_untyped": 8, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 17, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_classes": 3, "n_attrs": 12, "n_properties": 1, "n_type_ignores": 2 }, { "path": "vllm/multimodal/cache.py", "symbol_reports": [ { "kind": "class", "name": "vllm.multimodal.cache.BaseMultiModalProcessorCache", "methods": [ { "kind": "function", "name": "BaseMultiModalProcessorCache.is_cached_item", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseMultiModalProcessorCache.is_cached", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseMultiModalProcessorCache.close", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BaseMultiModalProcessorCache.touch_sender_cache_item", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseMultiModalProcessorCache.make_stats", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.multimodal.cache.MultiModalCache", "methods": [ { "kind": "function", "name": "MultiModalCache.get_leaf_size", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiModalCache.get_item_size", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MultiModalCache.get_item_complexity", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiModalCache.get_lru_cache", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 11, "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 7, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.multimodal.cache.MultiModalProcessorCacheItemMetadata", "methods": [ { "kind": "function", "name": "MultiModalProcessorCacheItemMetadata.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MultiModalProcessorCacheItemMetadata.item_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiModalProcessorCacheItemMetadata.prompt_updates", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 5, "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.multimodal.cache.MultiModalReceiverCache", "methods": [ { "kind": "function", "name": "MultiModalReceiverCache.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiModalReceiverCache.get_and_update_item", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MultiModalReceiverCache.touch_receiver_cache_item", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MultiModalReceiverCache.clear_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.multimodal.cache.ShmObjectStoreSenderCache", "methods": [ { "kind": "function", "name": "ShmObjectStoreSenderCache.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ShmObjectStoreSenderCache._stat", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ShmObjectStoreSenderCache.is_cached_item", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ShmObjectStoreSenderCache.get_and_update_item", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ShmObjectStoreSenderCache.touch_sender_cache_item", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ShmObjectStoreSenderCache.clear_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ShmObjectStoreSenderCache.make_stats", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ShmObjectStoreSenderCache.close", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ShmObjectStoreSenderCache.remove_dangling_items", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ShmObjectStoreSenderCache.address_as_item", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ShmObjectStoreSenderCache.world_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 19, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 9, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.multimodal.cache.MultiModalCacheValue", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.multimodal.cache.BaseMultiModalCache", "methods": [ { "kind": "function", "name": "BaseMultiModalCache.get_and_update_item", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseMultiModalCache.get_and_update", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseMultiModalCache.clear_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.multimodal.cache.MultiModalProcessorCacheOutItem", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.multimodal.cache.MultiModalProcessorSenderCache", "methods": [ { "kind": "function", "name": "MultiModalProcessorSenderCache.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiModalProcessorSenderCache.is_cached_item", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiModalProcessorSenderCache.get_and_update_item", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MultiModalProcessorSenderCache.touch_sender_cache_item", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiModalProcessorSenderCache.clear_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MultiModalProcessorSenderCache.make_stats", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 6, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.multimodal.cache.MultiModalProcessorCacheInItem", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.multimodal.cache.ShmObjectStoreReceiverCache", "methods": [ { "kind": "function", "name": "ShmObjectStoreReceiverCache.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ShmObjectStoreReceiverCache.get_and_update_item", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ShmObjectStoreReceiverCache.touch_receiver_cache_item", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ShmObjectStoreReceiverCache.clear_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ShmObjectStoreReceiverCache.world_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 10, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 6, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.multimodal.cache.MultiModalProcessorOnlyCache", "methods": [ { "kind": "function", "name": "MultiModalProcessorOnlyCache.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiModalProcessorOnlyCache.is_cached_item", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiModalProcessorOnlyCache.get_and_update_item", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MultiModalProcessorOnlyCache.touch_sender_cache_item", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiModalProcessorOnlyCache.clear_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MultiModalProcessorOnlyCache.make_stats", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 6, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.multimodal.cache.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.multimodal.cache.BaseMultiModalReceiverCache", "methods": [ { "kind": "function", "name": "BaseMultiModalReceiverCache.get_and_update_features", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseMultiModalReceiverCache.touch_receiver_cache_item", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.multimodal.cache.MultiModalProcessorCacheItem", "methods": [ { "kind": "function", "name": "MultiModalProcessorCacheItem.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MultiModalProcessorCacheItem.item", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiModalProcessorCacheItem.prompt_updates", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 5, "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.multimodal.cache", "names": [ "vllm.multimodal.cache.BaseMultiModalCache", "vllm.multimodal.cache.BaseMultiModalProcessorCache", "vllm.multimodal.cache.BaseMultiModalReceiverCache", "vllm.multimodal.cache.MultiModalCache", "vllm.multimodal.cache.MultiModalCacheValue", "vllm.multimodal.cache.MultiModalProcessorCacheInItem", "vllm.multimodal.cache.MultiModalProcessorCacheItem", "vllm.multimodal.cache.MultiModalProcessorCacheItemMetadata", "vllm.multimodal.cache.MultiModalProcessorCacheOutItem", "vllm.multimodal.cache.MultiModalProcessorOnlyCache", "vllm.multimodal.cache.MultiModalProcessorSenderCache", "vllm.multimodal.cache.MultiModalReceiverCache", "vllm.multimodal.cache.ShmObjectStoreReceiverCache", "vllm.multimodal.cache.ShmObjectStoreSenderCache", "vllm.multimodal.cache.logger" ], "n_typable": 110, "n_typed": 103, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 46, "n_method_overloads": 46, "n_method_params": 54, "n_classes": 11, "n_attrs": 10, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/multimodal/encoder_budget.py", "symbol_reports": [ { "kind": "class", "name": "vllm.multimodal.encoder_budget.MultiModalBudget", "methods": [ { "kind": "function", "name": "MultiModalBudget.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MultiModalBudget._get_max_items", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MultiModalBudget.get_modality_with_max_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MultiModalBudget.get_encoder_budget", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MultiModalBudget.reset_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MultiModalBudget.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiModalBudget.scheduler_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiModalBudget.max_model_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiModalBudget.max_num_reqs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiModalBudget.encoder_compute_budget", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiModalBudget.encoder_cache_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiModalBudget.mm_max_toks_per_item", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiModalBudget.mm_max_items_per_prompt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MultiModalBudget.mm_max_items_per_batch", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MultiModalBudget.cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiModalBudget.processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiModalBudget.mm_limits", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 11, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 4, "n_attrs": 12, "n_properties": 0 }, { "kind": "attr", "name": "vllm.multimodal.encoder_budget.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.multimodal.encoder_budget.get_mm_max_toks_per_item", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "type_ignores": [], "name": "vllm.multimodal.encoder_budget", "names": [ "vllm.multimodal.encoder_budget.MultiModalBudget", "vllm.multimodal.encoder_budget.get_mm_max_toks_per_item", "vllm.multimodal.encoder_budget.logger" ], "n_typable": 27, "n_typed": 16, "n_any": 0, "n_untyped": 11, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 4, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 4, "n_classes": 1, "n_attrs": 13, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/multimodal/evs.py", "symbol_reports": [ { "kind": "function", "name": "vllm.multimodal.evs.recompute_mrope_positions", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "vllm.multimodal.evs.compute_mrope_for_media", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.multimodal.evs.compute_retention_mask", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.multimodal.evs.compute_retained_tokens_count", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [], "name": "vllm.multimodal.evs", "names": [ "vllm.multimodal.evs.compute_mrope_for_media", "vllm.multimodal.evs.compute_retained_tokens_count", "vllm.multimodal.evs.compute_retention_mask", "vllm.multimodal.evs.recompute_mrope_positions" ], "n_typable": 22, "n_typed": 22, "n_any": 0, "n_untyped": 0, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 18, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/multimodal/image.py", "symbol_reports": [ { "kind": "function", "name": "vllm.multimodal.image.convert_image_mode", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.multimodal.image.rescale_image_size", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.multimodal.image.rgba_to_rgb", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.multimodal.image", "names": [ "vllm.multimodal.image.convert_image_mode", "vllm.multimodal.image.rescale_image_size", "vllm.multimodal.image.rgba_to_rgb" ], "n_typable": 10, "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 7, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/multimodal/media/base.py", "symbol_reports": [ { "kind": "class", "name": "vllm.multimodal.media.base.MediaWithBytes", "methods": [ { "kind": "function", "name": "MediaWithBytes.__array__", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MediaWithBytes.__getstate__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MediaWithBytes.__setstate__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MediaWithBytes.__getattr__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MediaWithBytes.media", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MediaWithBytes.original_bytes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 8, "n_typed": 3, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 4, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.multimodal.media.base.MediaIO", "methods": [ { "kind": "function", "name": "MediaIO.load_bytes", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MediaIO.load_base64", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MediaIO.load_file", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.multimodal.media.base", "names": [ "vllm.multimodal.media.base.MediaIO", "vllm.multimodal.media.base.MediaWithBytes" ], "n_typable": 15, "n_typed": 10, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 8, "n_classes": 2, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/multimodal/media/connector.py", "symbol_reports": [ { "kind": "class", "name": "vllm.multimodal.media.connector.MediaConnector", "methods": [ { "kind": "function", "name": "MediaConnector.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MediaConnector._load_data_url", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MediaConnector._load_file_url", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MediaConnector._assert_url_in_allowed_media_domains", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MediaConnector.load_from_url", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MediaConnector.load_from_url_async", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MediaConnector.fetch_audio", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MediaConnector.fetch_audio_async", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MediaConnector.fetch_image", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MediaConnector.fetch_image_async", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MediaConnector.fetch_video", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MediaConnector.fetch_video_async", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MediaConnector.fetch_image_embedding", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MediaConnector.fetch_audio_embedding", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MediaConnector.media_io_kwargs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MediaConnector.connection", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MediaConnector.allowed_local_media_path", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MediaConnector.allowed_media_domains", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 45, "n_typed": 42, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 27, "n_attrs": 4, "n_properties": 0 }, { "kind": "attr", "name": "vllm.multimodal.media.connector.MEDIA_CONNECTOR_REGISTRY", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.multimodal.media.connector.global_thread_pool", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [ { "kind": "type", "rules": [ "type-var" ] }, { "kind": "type", "rules": [ "type-var" ] }, { "kind": "type", "rules": [ "type-var" ] } ], "name": "vllm.multimodal.media.connector", "names": [ "vllm.multimodal.media.connector.MEDIA_CONNECTOR_REGISTRY", "vllm.multimodal.media.connector.MediaConnector", "vllm.multimodal.media.connector.global_thread_pool" ], "n_typable": 47, "n_typed": 42, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 27, "n_classes": 1, "n_attrs": 6, "n_properties": 0, "n_type_ignores": 3 }, { "path": "vllm/multimodal/video.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.multimodal.video.VIDEO_LOADER_REGISTRY", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.multimodal.video.sample_frames_from_video", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.multimodal.video.OpenCVVideoBackend", "methods": [ { "kind": "function", "name": "OpenCVVideoBackend.get_cv2_video_api", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "OpenCVVideoBackend.load_bytes", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [], "n_typable": 8, "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.multimodal.video.resize_video", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.multimodal.video.OpenCVDynamicOpenPanguVideoBackend", "methods": [ { "kind": "function", "name": "OpenCVDynamicOpenPanguVideoBackend.load_bytes", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 6, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.multimodal.video.VideoLoader", "methods": [ { "kind": "function", "name": "VideoLoader.load_bytes", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "VideoLoader._can_use_for_recovery", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "VideoLoader._read_frames_with_recovery", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "VideoLoader._read_frames", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [], "n_typable": 18, "n_typed": 16, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 14, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.multimodal.video.OpenCVDynamicVideoBackend", "methods": [ { "kind": "function", "name": "OpenCVDynamicVideoBackend.load_bytes", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 6, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.multimodal.video.Molmo2VideoBackend", "methods": [ { "kind": "function", "name": "Molmo2VideoBackend.get_cv2_video_api", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Molmo2VideoBackend.get_candidate_target_fps", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Molmo2VideoBackend.get_target_fps", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Molmo2VideoBackend.get_frame_times_and_chosen_fps", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Molmo2VideoBackend.sample_times", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Molmo2VideoBackend._sample_frames", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "Molmo2VideoBackend.load_bytes_opencv", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Molmo2VideoBackend.load_bytes", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 42, "n_typed": 38, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 34, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.multimodal.video.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.multimodal.video.rescale_video_size", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.multimodal.video", "names": [ "vllm.multimodal.video.Molmo2VideoBackend", "vllm.multimodal.video.OpenCVDynamicOpenPanguVideoBackend", "vllm.multimodal.video.OpenCVDynamicVideoBackend", "vllm.multimodal.video.OpenCVVideoBackend", "vllm.multimodal.video.VIDEO_LOADER_REGISTRY", "vllm.multimodal.video.VideoLoader", "vllm.multimodal.video.logger", "vllm.multimodal.video.rescale_video_size", "vllm.multimodal.video.resize_video", "vllm.multimodal.video.sample_frames_from_video" ], "n_typable": 93, "n_typed": 81, "n_any": 0, "n_untyped": 12, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 6, "n_methods": 16, "n_method_overloads": 16, "n_method_params": 66, "n_classes": 5, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/multimodal/media/video.py", "symbol_reports": [ { "kind": "class", "name": "vllm.multimodal.media.video.VideoMediaIO", "methods": [ { "kind": "function", "name": "VideoMediaIO.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "VideoMediaIO.load_bytes", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "VideoMediaIO.load_base64", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VideoMediaIO.load_file", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "VideoMediaIO.encode_base64", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "VideoMediaIO.image_io", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VideoMediaIO.num_frames", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VideoMediaIO.kwargs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "VideoMediaIO.video_loader", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 13, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 4, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.multimodal.media.video", "names": [ "vllm.multimodal.media.video.VideoMediaIO" ], "n_typable": 18, "n_typed": 13, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_classes": 1, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/multimodal/media/audio.py", "symbol_reports": [ { "kind": "class", "name": "vllm.multimodal.media.audio.AudioMediaIO", "methods": [ { "kind": "function", "name": "AudioMediaIO.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AudioMediaIO.load_bytes", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AudioMediaIO.load_base64", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AudioMediaIO.load_file", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AudioMediaIO.encode_base64", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AudioMediaIO.kwargs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 11, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 7, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.multimodal.media.audio.AudioEmbeddingMediaIO", "methods": [ { "kind": "function", "name": "AudioEmbeddingMediaIO.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AudioEmbeddingMediaIO.load_bytes", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AudioEmbeddingMediaIO.load_base64", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AudioEmbeddingMediaIO.load_file", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AudioEmbeddingMediaIO.encode_base64", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 10, "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.multimodal.media.audio.soundfile", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.multimodal.media.audio.librosa", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [ { "kind": "type", "rules": [ "assignment" ] }, { "kind": "type", "rules": [ "assignment" ] } ], "name": "vllm.multimodal.media.audio", "names": [ "vllm.multimodal.media.audio.AudioEmbeddingMediaIO", "vllm.multimodal.media.audio.AudioMediaIO", "vllm.multimodal.media.audio.librosa", "vllm.multimodal.media.audio.soundfile" ], "n_typable": 25, "n_typed": 21, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 12, "n_classes": 2, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 2 }, { "path": "vllm/multimodal/media/image.py", "symbol_reports": [ { "kind": "class", "name": "vllm.multimodal.media.image.ImageMediaIO", "methods": [ { "kind": "function", "name": "ImageMediaIO.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ImageMediaIO._convert_image_mode", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ImageMediaIO.load_bytes", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ImageMediaIO.load_base64", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ImageMediaIO.load_file", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ImageMediaIO.encode_base64", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ImageMediaIO.image_mode", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ImageMediaIO.kwargs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ImageMediaIO.rgba_background_color", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 14, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 9, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.multimodal.media.image.ImageEmbeddingMediaIO", "methods": [ { "kind": "function", "name": "ImageEmbeddingMediaIO.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ImageEmbeddingMediaIO.load_bytes", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ImageEmbeddingMediaIO.load_base64", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ImageEmbeddingMediaIO.load_file", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ImageEmbeddingMediaIO.encode_base64", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 10, "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.multimodal.media.image", "names": [ "vllm.multimodal.media.image.ImageEmbeddingMediaIO", "vllm.multimodal.media.image.ImageMediaIO" ], "n_typable": 28, "n_typed": 24, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 14, "n_classes": 2, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/multimodal/parse.py", "symbol_reports": [ { "kind": "class", "name": "vllm.multimodal.parse.MultiModalDataParser", "methods": [ { "kind": "function", "name": "MultiModalDataParser.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MultiModalDataParser.is_embeddings", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiModalDataParser._get_audio_with_sr", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiModalDataParser._get_video_with_metadata", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiModalDataParser._parse_audio_data", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiModalDataParser._parse_image_data", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiModalDataParser._parse_video_data", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiModalDataParser._parse_vision_chunk_data", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiModalDataParser._get_subparsers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MultiModalDataParser.parse_mm_data", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MultiModalDataParser.audio_resampler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiModalDataParser.target_channels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiModalDataParser.video_needs_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MultiModalDataParser.expected_hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 27, "n_typed": 23, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 13, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.multimodal.parse.ModalityDataItems", "methods": [ { "kind": "function", "name": "ModalityDataItems.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ModalityDataItems.__repr__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModalityDataItems.__len__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModalityDataItems.__getitem__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModalityDataItems.__iter__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModalityDataItems.get_count", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModalityDataItems.get", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModalityDataItems.get_all", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModalityDataItems.get_item_for_hash", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModalityDataItems.get_all_items_for_hash", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModalityDataItems.get_processor_data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModalityDataItems.get_passthrough_data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ModalityDataItems.data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ModalityDataItems.modality", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 18, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 5, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.multimodal.parse.VideoEmbeddingItems", "methods": [ { "kind": "function", "name": "VideoEmbeddingItems.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.multimodal.parse.VideoProcessorItems", "methods": [ { "kind": "function", "name": "VideoProcessorItems.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "VideoProcessorItems.get_num_frames", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "VideoProcessorItems.get_frame_size", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "VideoProcessorItems.metadata", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.multimodal.parse.DictEmbeddingItems", "methods": [ { "kind": "function", "name": "DictEmbeddingItems.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "DictEmbeddingItems.get_count", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DictEmbeddingItems.get", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DictEmbeddingItems.get_processor_data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DictEmbeddingItems.get_passthrough_data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DictEmbeddingItems.fields_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DictEmbeddingItems.required_fields", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 10, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 5, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.multimodal.parse.ImageProcessorItems", "methods": [ { "kind": "function", "name": "ImageProcessorItems.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ImageProcessorItems.get_image_size", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.multimodal.parse.ProcessorBatchItems", "methods": [ { "kind": "function", "name": "ProcessorBatchItems._unwrap", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ProcessorBatchItems.get_count", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ProcessorBatchItems.get", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ProcessorBatchItems.get_item_for_hash", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ProcessorBatchItems.get_processor_data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ProcessorBatchItems.get_passthrough_data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.multimodal.parse.parse_mm_uuids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.multimodal.parse.PILImage", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.multimodal.parse.AudioProcessorItems", "methods": [ { "kind": "function", "name": "AudioProcessorItems.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AudioProcessorItems.get_audio_length", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.multimodal.parse.MultiModalDataItems", "methods": [ { "kind": "function", "name": "MultiModalDataItems.select", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiModalDataItems.get_count", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MultiModalDataItems.get_all_counts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MultiModalDataItems.get_items", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.multimodal.parse.ModalityDataParser", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.multimodal.parse.AudioEmbeddingItems", "methods": [ { "kind": "function", "name": "AudioEmbeddingItems.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.multimodal.parse.MultiModalUUIDItems", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.multimodal.parse.validate_embedding_ndim", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.multimodal.parse.ImageEmbeddingItems", "methods": [ { "kind": "function", "name": "ImageEmbeddingItems.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.multimodal.parse.VisionChunkProcessorItems", "methods": [ { "kind": "function", "name": "VisionChunkProcessorItems.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.multimodal.parse.EmbeddingItems", "methods": [ { "kind": "function", "name": "EmbeddingItems.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "EmbeddingItems._validate_ndim", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EmbeddingItems._validate_hidden_size", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EmbeddingItems._unwrap", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EmbeddingItems.get_count", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EmbeddingItems.get", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EmbeddingItems.get_processor_data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EmbeddingItems.get_passthrough_data", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EmbeddingItems.get_feature_size", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 16, "n_typed": 16, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 7, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.multimodal.parse.ImageSize", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ImageSize.width", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ImageSize.height", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.multimodal.parse", "names": [ "vllm.multimodal.parse.AudioEmbeddingItems", "vllm.multimodal.parse.AudioProcessorItems", "vllm.multimodal.parse.DictEmbeddingItems", "vllm.multimodal.parse.EmbeddingItems", "vllm.multimodal.parse.ImageEmbeddingItems", "vllm.multimodal.parse.ImageProcessorItems", "vllm.multimodal.parse.ImageSize", "vllm.multimodal.parse.ModalityDataItems", "vllm.multimodal.parse.ModalityDataParser", "vllm.multimodal.parse.MultiModalDataItems", "vllm.multimodal.parse.MultiModalDataParser", "vllm.multimodal.parse.MultiModalUUIDItems", "vllm.multimodal.parse.PILImage", "vllm.multimodal.parse.ProcessorBatchItems", "vllm.multimodal.parse.VideoEmbeddingItems", "vllm.multimodal.parse.VideoProcessorItems", "vllm.multimodal.parse.VisionChunkProcessorItems", "vllm.multimodal.parse.parse_mm_uuids", "vllm.multimodal.parse.validate_embedding_ndim" ], "n_typable": 128, "n_typed": 118, "n_any": 0, "n_untyped": 10, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 4, "n_methods": 57, "n_method_overloads": 57, "n_method_params": 53, "n_classes": 14, "n_attrs": 14, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/multimodal/processing/context.py", "symbol_reports": [ { "kind": "class", "name": "vllm.multimodal.processing.context.InputProcessingContext", "methods": [ { "kind": "function", "name": "InputProcessingContext.get_tokenizer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "InputProcessingContext.get_hf_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 2, "n_params": 1, "n_function_overloads": 2, "n_function_params": 1 }, { "kind": "function", "name": "InputProcessingContext.get_hf_image_processor_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "InputProcessingContext.get_mm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "InputProcessingContext.get_hf_processor", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 3, "n_params": 2, "n_function_overloads": 2, "n_function_params": 2 }, { "kind": "function", "name": "InputProcessingContext.init_processor", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InputProcessingContext._postprocess_output", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InputProcessingContext.get_merged_mm_kwargs", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InputProcessingContext.call_hf_processor", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "InputProcessingContext.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "InputProcessingContext.tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 21, "n_typed": 19, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 11, "n_method_params": 12, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.multimodal.processing.context.TimingContext", "methods": [ { "kind": "function", "name": "TimingContext.record", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TimingContext.get_stats_dict", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "TimingContext.total_secs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "TimingContext.enabled", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TimingContext.stage_secs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 4, "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 2, "n_properties": 1 }, { "kind": "class", "name": "vllm.multimodal.processing.context.BaseProcessingInfo", "methods": [ { "kind": "function", "name": "BaseProcessingInfo.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseProcessingInfo.get_tokenizer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BaseProcessingInfo.get_hf_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BaseProcessingInfo.get_hf_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseProcessingInfo.get_default_tok_params", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BaseProcessingInfo._get_expected_hidden_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BaseProcessingInfo.get_data_parser", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BaseProcessingInfo.get_supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BaseProcessingInfo.validate_num_items", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseProcessingInfo.parse_mm_data", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseProcessingInfo.get_mm_max_tokens_per_item", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [ { "kind": "property", "name": "BaseProcessingInfo.model_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "BaseProcessingInfo.default_tok_params", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "BaseProcessingInfo.data_parser", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "BaseProcessingInfo.skip_prompt_length_check", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "BaseProcessingInfo.supported_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "BaseProcessingInfo.allowed_mm_limits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "BaseProcessingInfo.ctx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 26, "n_typed": 25, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 8, "n_attrs": 1, "n_properties": 6 }, { "kind": "attr", "name": "vllm.multimodal.processing.context.PretrainedConfig", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.multimodal.processing.context.BatchFeature", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.multimodal.processing.context.ProcessorMixin", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.multimodal.processing.context.ModelConfig", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.multimodal.processing.context.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.multimodal.processing.context", "names": [ "vllm.multimodal.processing.context.BaseProcessingInfo", "vllm.multimodal.processing.context.BatchFeature", "vllm.multimodal.processing.context.InputProcessingContext", "vllm.multimodal.processing.context.ModelConfig", "vllm.multimodal.processing.context.PretrainedConfig", "vllm.multimodal.processing.context.ProcessorMixin", "vllm.multimodal.processing.context.TimingContext", "vllm.multimodal.processing.context.logger" ], "n_typable": 52, "n_typed": 46, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 22, "n_method_overloads": 24, "n_method_params": 21, "n_classes": 3, "n_attrs": 10, "n_properties": 7, "n_type_ignores": 0 }, { "path": "vllm/multimodal/processing/processor.py", "symbol_reports": [ { "kind": "class", "name": "vllm.multimodal.processing.processor.PromptUpdate", "methods": [ { "kind": "function", "name": "PromptUpdate._resolve_target", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PromptUpdate._resolve_content", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PromptUpdate.resolve", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "PromptUpdate.content", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "PromptUpdate.mode", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "PromptUpdate.modality", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PromptUpdate.target", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 8, "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_attrs": 2, "n_properties": 2 }, { "kind": "class", "name": "vllm.multimodal.processing.processor.EncDecMultiModalProcessor", "methods": [ { "kind": "function", "name": "EncDecMultiModalProcessor.create_encoder_prompt", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EncDecMultiModalProcessor.create_decoder_prompt", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EncDecMultiModalProcessor._get_enc_dec_inputs", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "EncDecMultiModalProcessor.apply", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 13, "n_typed": 12, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 9, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.multimodal.processing.processor.PromptIndexTargets", "methods": [ { "kind": "function", "name": "PromptIndexTargets.start", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PromptIndexTargets.prefix", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PromptIndexTargets.end", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.multimodal.processing.processor.PromptInsertion", "methods": [], "properties": [ { "kind": "property", "name": "PromptInsertion.content", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "PromptInsertion.mode", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "PromptInsertion.insertion", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 2 }, { "kind": "class", "name": "vllm.multimodal.processing.processor.PromptUpdateDetails", "methods": [ { "kind": "function", "name": "PromptUpdateDetails.from_seq", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PromptUpdateDetails.select_text", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PromptUpdateDetails.select_token_id", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PromptUpdateDetails.select_token_ids", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PromptUpdateDetails.full", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PromptUpdateDetails.is_embed", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 11, "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 7, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.multimodal.processing.processor.PromptReplacement", "methods": [], "properties": [ { "kind": "property", "name": "PromptReplacement.content", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "PromptReplacement.mode", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "PromptReplacement.replacement", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 2 }, { "kind": "class", "name": "vllm.multimodal.processing.processor.BaseMultiModalProcessor", "methods": [ { "kind": "function", "name": "BaseMultiModalProcessor.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BaseMultiModalProcessor.__call__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BaseMultiModalProcessor._get_mm_fields_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseMultiModalProcessor._get_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BaseMultiModalProcessor._bind_and_group_updates", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseMultiModalProcessor._get_mm_prompt_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BaseMultiModalProcessor._find_mm_placeholders", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseMultiModalProcessor._get_hf_mm_data", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseMultiModalProcessor._call_hf_processor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BaseMultiModalProcessor._hf_processor_applies_updates", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BaseMultiModalProcessor._apply_hf_processor_text_mm", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BaseMultiModalProcessor._apply_hf_processor_text_only", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseMultiModalProcessor._apply_hf_processor_tokens_only", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseMultiModalProcessor._apply_hf_processor_mm_only", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BaseMultiModalProcessor._apply_hf_processor_main", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "BaseMultiModalProcessor._get_cache_missing_items", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BaseMultiModalProcessor._recompute_cached_prompt_update", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseMultiModalProcessor._merge_mm_kwargs", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "BaseMultiModalProcessor._apply_hf_processor", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseMultiModalProcessor._cached_apply_hf_processor", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseMultiModalProcessor._apply_token_matches", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseMultiModalProcessor._apply_text_matches", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseMultiModalProcessor._apply_prompt_updates", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseMultiModalProcessor._validate_mm_kwargs", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseMultiModalProcessor._validate_mm_updates", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseMultiModalProcessor._validate_mm_placeholders", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseMultiModalProcessor._maybe_apply_prompt_updates", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "BaseMultiModalProcessor.apply", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BaseMultiModalProcessor.info", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseMultiModalProcessor.dummy_inputs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseMultiModalProcessor.cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseMultiModalProcessor.data_parser", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 108, "n_typed": 104, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 28, "n_method_overloads": 28, "n_method_params": 76, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.multimodal.processing.processor.UpdateMode", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "UpdateMode.INSERT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "UpdateMode.REPLACE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "function", "name": "vllm.multimodal.processing.processor.full_groupby_modality", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.multimodal.processing.processor.replace_token_matches", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.multimodal.processing.processor.PromptTargetMatch", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "PromptTargetMatch.start_idx", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PromptTargetMatch.end_idx", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.multimodal.processing.processor.UpdateTarget", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.multimodal.processing.processor.MultiModalPromptUpdatesApplyResult", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.multimodal.processing.processor.MultiModalIsCached", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.multimodal.processing.processor.MultiModalProcessingInfo", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "MultiModalProcessingInfo.kwargs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MultiModalProcessingInfo.hashes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MultiModalProcessingInfo.prompt_updates", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.multimodal.processing.processor.BaseMultiModalProcessorCache", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.multimodal.processing.processor.PromptSeq", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.multimodal.processing.processor.PromptIndex", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "PromptIndex.get_match_index", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.multimodal.processing.processor.PromptUpdateInfo", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.multimodal.processing.processor.MultiModalPromptUpdates", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.multimodal.processing.processor.iter_token_matches", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.multimodal.processing.processor.PlaceholderFeaturesInfo", "methods": [ { "kind": "function", "name": "PlaceholderFeaturesInfo.to_range", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "PlaceholderFeaturesInfo.length", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "PlaceholderFeaturesInfo.modality", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PlaceholderFeaturesInfo.item_idx", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PlaceholderFeaturesInfo.start_idx", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PlaceholderFeaturesInfo.tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PlaceholderFeaturesInfo.is_embed", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 5, "n_properties": 1 }, { "kind": "function", "name": "vllm.multimodal.processing.processor.find_mm_placeholders", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.multimodal.processing.processor.ResolvedPromptUpdate", "methods": [ { "kind": "function", "name": "ResolvedPromptUpdate.iter_token_matches", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ResolvedPromptUpdate.iter_text_matches", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ResolvedPromptUpdate.iter_matches", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ResolvedPromptUpdate.with_target", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ResolvedPromptUpdate.with_content", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ResolvedPromptUpdate.modality", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ResolvedPromptUpdate.item_idx", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ResolvedPromptUpdate.mode", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ResolvedPromptUpdate.target", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ResolvedPromptUpdate.content", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 16, "n_typed": 14, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 11, "n_attrs": 5, "n_properties": 0 }, { "kind": "attr", "name": "vllm.multimodal.processing.processor.BatchFeature", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.multimodal.processing.processor.PromptUpdateTarget", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.multimodal.processing.processor.PromptUpdateContent", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.multimodal.processing.processor.apply_text_matches", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.multimodal.processing.processor.apply_token_matches", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.multimodal.processing.processor.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.multimodal.processing.processor", "names": [ "vllm.multimodal.processing.processor.BaseMultiModalProcessor", "vllm.multimodal.processing.processor.BaseMultiModalProcessorCache", "vllm.multimodal.processing.processor.BatchFeature", "vllm.multimodal.processing.processor.EncDecMultiModalProcessor", "vllm.multimodal.processing.processor.MultiModalIsCached", "vllm.multimodal.processing.processor.MultiModalProcessingInfo", "vllm.multimodal.processing.processor.MultiModalPromptUpdates", "vllm.multimodal.processing.processor.MultiModalPromptUpdatesApplyResult", "vllm.multimodal.processing.processor.PlaceholderFeaturesInfo", "vllm.multimodal.processing.processor.PromptIndex", "vllm.multimodal.processing.processor.PromptIndexTargets", "vllm.multimodal.processing.processor.PromptInsertion", "vllm.multimodal.processing.processor.PromptReplacement", "vllm.multimodal.processing.processor.PromptSeq", "vllm.multimodal.processing.processor.PromptTargetMatch", "vllm.multimodal.processing.processor.PromptUpdate", "vllm.multimodal.processing.processor.PromptUpdateContent", "vllm.multimodal.processing.processor.PromptUpdateDetails", "vllm.multimodal.processing.processor.PromptUpdateInfo", "vllm.multimodal.processing.processor.PromptUpdateTarget", "vllm.multimodal.processing.processor.ResolvedPromptUpdate", "vllm.multimodal.processing.processor.UpdateMode", "vllm.multimodal.processing.processor.UpdateTarget", "vllm.multimodal.processing.processor.apply_text_matches", "vllm.multimodal.processing.processor.apply_token_matches", "vllm.multimodal.processing.processor.find_mm_placeholders", "vllm.multimodal.processing.processor.full_groupby_modality", "vllm.multimodal.processing.processor.iter_token_matches", "vllm.multimodal.processing.processor.logger", "vllm.multimodal.processing.processor.replace_token_matches" ], "n_typable": 196, "n_typed": 188, "n_any": 0, "n_untyped": 8, "n_functions": 6, "n_function_overloads": 6, "n_function_params": 16, "n_methods": 48, "n_method_overloads": 48, "n_method_params": 107, "n_classes": 13, "n_attrs": 39, "n_properties": 7, "n_type_ignores": 0 }, { "path": "vllm/multimodal/processing/dummy_inputs.py", "symbol_reports": [ { "kind": "class", "name": "vllm.multimodal.processing.dummy_inputs.BaseDummyInputsBuilder", "methods": [ { "kind": "function", "name": "BaseDummyInputsBuilder.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseDummyInputsBuilder.get_dummy_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseDummyInputsBuilder.get_dummy_mm_data", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BaseDummyInputsBuilder.get_dummy_processor_inputs", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BaseDummyInputsBuilder._get_dummy_audios", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BaseDummyInputsBuilder._get_dummy_images", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BaseDummyInputsBuilder._get_dummy_videos", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BaseDummyInputsBuilder.info", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 28, "n_typed": 27, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 20, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.multimodal.processing.dummy_inputs.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.multimodal.processing.dummy_inputs", "names": [ "vllm.multimodal.processing.dummy_inputs.BaseDummyInputsBuilder", "vllm.multimodal.processing.dummy_inputs.logger" ], "n_typable": 29, "n_typed": 27, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 20, "n_classes": 1, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/multimodal/processing/inputs.py", "symbol_reports": [ { "kind": "class", "name": "vllm.multimodal.processing.inputs.ProcessorInputs", "methods": [ { "kind": "function", "name": "ProcessorInputs.get_mm_hashes", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ProcessorInputs.prompt", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ProcessorInputs.mm_data_items", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ProcessorInputs.mm_uuid_items", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ProcessorInputs.hf_processor_mm_kwargs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ProcessorInputs.tokenization_kwargs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 5, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.multimodal.processing.inputs", "names": [ "vllm.multimodal.processing.inputs.ProcessorInputs" ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_classes": 1, "n_attrs": 5, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/multimodal/utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.multimodal.utils.encode_image_base64", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.multimodal.utils.fetch_image", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.multimodal.utils.fetch_audio", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.multimodal.utils.group_mm_kwargs_by_modality", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.multimodal.utils.torch", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.multimodal.utils.encode_video_url", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.multimodal.utils.fetch_video", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.multimodal.utils.encode_audio_url", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.multimodal.utils.group_and_batch_mm_items", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.multimodal.utils.argsort_mm_positions", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.multimodal.utils.encode_image_url", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.multimodal.utils.encode_video_base64", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.multimodal.utils.encode_audio_base64", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [], "name": "vllm.multimodal.utils", "names": [ "vllm.multimodal.utils.argsort_mm_positions", "vllm.multimodal.utils.encode_audio_base64", "vllm.multimodal.utils.encode_audio_url", "vllm.multimodal.utils.encode_image_base64", "vllm.multimodal.utils.encode_image_url", "vllm.multimodal.utils.encode_video_base64", "vllm.multimodal.utils.encode_video_url", "vllm.multimodal.utils.fetch_audio", "vllm.multimodal.utils.fetch_image", "vllm.multimodal.utils.fetch_video", "vllm.multimodal.utils.group_and_batch_mm_items", "vllm.multimodal.utils.group_mm_kwargs_by_modality", "vllm.multimodal.utils.torch" ], "n_typable": 42, "n_typed": 41, "n_any": 0, "n_untyped": 1, "n_functions": 12, "n_function_overloads": 12, "n_function_params": 29, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/parser/abstract_parser.py", "symbol_reports": [ { "kind": "class", "name": "vllm.parser.abstract_parser._WrappedParser", "methods": [ { "kind": "function", "name": "_WrappedParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "_WrappedParser.reasoning_parser_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "_WrappedParser.tool_parser_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.parser.abstract_parser.Parser", "methods": [ { "kind": "function", "name": "Parser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Parser.is_reasoning_end", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Parser.is_reasoning_end_streaming", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Parser.extract_content_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Parser.extract_response_outputs", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Parser.extract_reasoning", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Parser.extract_reasoning_streaming", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Parser.adjust_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Parser.extract_tool_calls", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Parser.extract_tool_calls_streaming", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [ { "kind": "property", "name": "Parser.vocab", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Parser.reasoning_parser", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_typable": 2 }, { "kind": "property", "name": "Parser.tool_parser", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_typable": 2 } ], "attrs": [ { "kind": "attr", "name": "Parser.reasoning_parser_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Parser.tool_parser_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Parser.model_tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 48, "n_typed": 44, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 30, "n_attrs": 3, "n_properties": 3 }, { "kind": "class", "name": "vllm.parser.abstract_parser.DelegatingParser", "methods": [ { "kind": "function", "name": "DelegatingParser.extract_reasoning", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DelegatingParser.extract_response_outputs", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "DelegatingParser._parse_tool_calls", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DelegatingParser.extract_reasoning_streaming", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "DelegatingParser.extract_tool_calls", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DelegatingParser.extract_tool_calls_streaming", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [], "n_typable": 31, "n_typed": 31, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 25, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.parser.abstract_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.parser.abstract_parser", "names": [ "vllm.parser.abstract_parser.DelegatingParser", "vllm.parser.abstract_parser.Parser", "vllm.parser.abstract_parser._WrappedParser", "vllm.parser.abstract_parser.logger" ], "n_typable": 84, "n_typed": 78, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 17, "n_method_overloads": 17, "n_method_params": 56, "n_classes": 3, "n_attrs": 6, "n_properties": 3, "n_type_ignores": 0 }, { "path": "vllm/parser/parser_manager.py", "symbol_reports": [ { "kind": "class", "name": "vllm.parser.parser_manager.ParserManager", "methods": [ { "kind": "function", "name": "ParserManager.get_parser_internal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ParserManager._load_lazy_parser", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ParserManager._register_module", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ParserManager.register_lazy_module", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ParserManager.register_module", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ParserManager.list_registered", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ParserManager.import_parser", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ParserManager.get_tool_parser", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ParserManager.get_reasoning_parser", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ParserManager.get_parser", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ParserManager.parsers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParserManager.lazy_parsers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 32, "n_typed": 32, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 20, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.parser.parser_manager.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.parser.parser_manager", "names": [ "vllm.parser.parser_manager.ParserManager", "vllm.parser.parser_manager.logger" ], "n_typable": 33, "n_typed": 32, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 20, "n_classes": 1, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/parser/minimax_m2_parser.py", "symbol_reports": [ { "kind": "class", "name": "vllm.parser.minimax_m2_parser.MiniMaxM2Parser", "methods": [ { "kind": "function", "name": "MiniMaxM2Parser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniMaxM2Parser.reasoning_parser_cls", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MiniMaxM2Parser.tool_parser_cls", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 2, "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.parser.minimax_m2_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.parser.minimax_m2_parser", "names": [ "vllm.parser.minimax_m2_parser.MiniMaxM2Parser", "vllm.parser.minimax_m2_parser.logger" ], "n_typable": 3, "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_classes": 1, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/platforms/interface.py", "symbol_reports": [ { "kind": "class", "name": "vllm.platforms.interface.Platform", "methods": [ { "kind": "function", "name": "Platform.is_cuda", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Platform.is_rocm", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Platform.is_tpu", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Platform.is_xpu", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Platform.is_cpu", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Platform.is_out_of_tree", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Platform.is_unspecified", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Platform.get_max_output_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Platform.is_cuda_alike", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Platform.is_sleep_mode_available", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Platform.get_pass_manager_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Platform.get_compile_backend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Platform.device_id_to_physical_device_id", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Platform.import_kernels", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Platform.get_attn_backend_cls", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Platform.get_supported_vit_attn_backends", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Platform.get_vit_attn_backend", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Platform.get_device_capability", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Platform.has_device_capability", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Platform.is_device_capability", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Platform.is_device_capability_family", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Platform.get_device_name", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Platform.get_device_uuid", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Platform.get_device_total_memory", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Platform.inference_mode", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Platform.set_device", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Platform.pre_register_and_update", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Platform.apply_config_platform_defaults", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Platform.check_and_update_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Platform.verify_model_arch", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Platform.verify_quantization", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Platform.get_cpu_architecture", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Platform.is_pin_memory_available", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Platform.get_current_memory_usage", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Platform.get_punica_wrapper", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Platform.get_infinity_values", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Platform.can_update_inplace", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Platform.get_lora_vocab_padding_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Platform.get_device_communicator_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Platform.supports_mx", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Platform.supports_fp8", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Platform.is_fp8_fnuz", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Platform.fp8_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Platform.use_all_gather", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Platform.use_custom_allreduce", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Platform.opaque_attention_op", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Platform.validate_request", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Platform.__getattr__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Platform.get_global_graph_pool", "n_typed": 0, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Platform.get_static_graph_wrapper_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Platform.stateless_init_device_torch_dist_pg", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Platform.check_if_supports_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Platform.support_hybrid_kv_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Platform.support_static_graph_mode", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Platform.use_sync_weight_loader", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Platform.make_synced_weight_loader", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Platform.get_nixl_supported_devices", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Platform.get_nixl_memory_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Platform.check_max_model_len", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Platform.set_additional_forward_context", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Platform.num_compute_units", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "Platform.pass_key", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Platform.supported_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "Platform._enum", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Platform.device_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Platform.device_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Platform.dispatch_key", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Platform.ray_device_key", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Platform.device_control_env_var", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Platform.ray_noset_device_env_vars", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Platform.simple_compile_backend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Platform.dist_backend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Platform.supported_quantization", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Platform.additional_env_vars", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Platform._global_graph_pool", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 115, "n_typed": 106, "n_any": 1, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 61, "n_method_overloads": 61, "n_method_params": 40, "n_attrs": 12, "n_properties": 2 }, { "kind": "class", "name": "vllm.platforms.interface.PlatformEnum", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "PlatformEnum.CUDA", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PlatformEnum.ROCM", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PlatformEnum.TPU", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PlatformEnum.XPU", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PlatformEnum.CPU", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PlatformEnum.OOT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PlatformEnum.UNSPECIFIED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.platforms.interface.CpuArchEnum", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "CpuArchEnum.X86", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CpuArchEnum.ARM", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CpuArchEnum.POWERPC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CpuArchEnum.S390X", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CpuArchEnum.RISCV", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CpuArchEnum.OTHER", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CpuArchEnum.UNKNOWN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 7, "n_properties": 0 }, { "kind": "function", "name": "vllm.platforms.interface.in_wsl", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.platforms.interface.FlexibleArgumentParser", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.platforms.interface.DeviceCapability", "methods": [ { "kind": "function", "name": "DeviceCapability.__lt__", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeviceCapability.__le__", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeviceCapability.__eq__", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeviceCapability.__ge__", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeviceCapability.__gt__", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeviceCapability.as_version_str", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeviceCapability.to_int", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DeviceCapability.major", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeviceCapability.minor", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 12, "n_typed": 7, "n_any": 5, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 5, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.platforms.interface.UnspecifiedPlatform", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "UnspecifiedPlatform._enum", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "UnspecifiedPlatform.device_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.platforms.interface.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.platforms.interface", "names": [ "vllm.platforms.interface.CpuArchEnum", "vllm.platforms.interface.DeviceCapability", "vllm.platforms.interface.FlexibleArgumentParser", "vllm.platforms.interface.Platform", "vllm.platforms.interface.PlatformEnum", "vllm.platforms.interface.UnspecifiedPlatform", "vllm.platforms.interface.in_wsl", "vllm.platforms.interface.logger" ], "n_typable": 129, "n_typed": 114, "n_any": 6, "n_untyped": 9, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 0, "n_methods": 68, "n_method_overloads": 68, "n_method_params": 45, "n_classes": 5, "n_attrs": 32, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/platforms/__init__.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.platforms._init_trace", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.platforms.current_platform", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.platforms", "names": [ "vllm.platforms._init_trace", "vllm.platforms.current_platform" ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/platforms/cpu.py", "symbol_reports": [ { "kind": "function", "name": "vllm.platforms.cpu.get_max_threads", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.platforms.cpu.VllmConfig", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.platforms.cpu.CpuPlatform", "methods": [ { "kind": "function", "name": "CpuPlatform.get_device_name", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CpuPlatform.get_attn_backend_cls", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "CpuPlatform.get_device_total_memory", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CpuPlatform.set_device", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CpuPlatform.inference_mode", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CpuPlatform.check_and_update_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CpuPlatform.get_allowed_cpu_core_node_list", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CpuPlatform.discover_numa_topology", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CpuPlatform.is_pin_memory_available", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CpuPlatform.get_punica_wrapper", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CpuPlatform.get_device_communicator_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CpuPlatform.supports_structured_output", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CpuPlatform.opaque_attention_op", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CpuPlatform.support_hybrid_kv_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CpuPlatform.import_kernels", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "CpuPlatform.supported_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "CpuPlatform._enum", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CpuPlatform.device_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CpuPlatform.device_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CpuPlatform.dispatch_key", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CpuPlatform.dist_backend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CpuPlatform.device_control_env_var", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 27, "n_typed": 26, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 7, "n_attrs": 6, "n_properties": 1 }, { "kind": "class", "name": "vllm.platforms.cpu.LogicalCPUInfo", "methods": [ { "kind": "function", "name": "LogicalCPUInfo._int", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LogicalCPUInfo.json_decoder", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LogicalCPUInfo.id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LogicalCPUInfo.physical_core", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LogicalCPUInfo.numa_node", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 4, "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.platforms.cpu.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.platforms.cpu", "names": [ "vllm.platforms.cpu.CpuPlatform", "vllm.platforms.cpu.LogicalCPUInfo", "vllm.platforms.cpu.VllmConfig", "vllm.platforms.cpu.get_max_threads", "vllm.platforms.cpu.logger" ], "n_typable": 34, "n_typed": 29, "n_any": 0, "n_untyped": 5, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 17, "n_method_overloads": 17, "n_method_params": 9, "n_classes": 2, "n_attrs": 11, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/platforms/cuda.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.platforms.cuda.nvml_available", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.platforms.cuda.CudaPlatformBase", "methods": [ { "kind": "function", "name": "CudaPlatformBase.set_device", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CudaPlatformBase.get_device_capability", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CudaPlatformBase.get_device_name", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CudaPlatformBase.get_device_total_memory", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CudaPlatformBase.is_fully_connected", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CudaPlatformBase.log_warnings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CudaPlatformBase.check_and_update_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CudaPlatformBase.get_current_memory_usage", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CudaPlatformBase.get_valid_backends", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "CudaPlatformBase.get_attn_backend_cls", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "CudaPlatformBase.get_supported_vit_attn_backends", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CudaPlatformBase.get_vit_attn_backend", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "CudaPlatformBase.get_punica_wrapper", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CudaPlatformBase.get_device_communicator_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CudaPlatformBase.supports_fp8", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CudaPlatformBase.use_custom_allreduce", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CudaPlatformBase.opaque_attention_op", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CudaPlatformBase.get_static_graph_wrapper_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CudaPlatformBase.stateless_init_device_torch_dist_pg", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "CudaPlatformBase.device_count", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CudaPlatformBase.check_if_supports_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CudaPlatformBase.insert_blocks_to_device", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "CudaPlatformBase.swap_out_blocks_to_host", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "CudaPlatformBase.support_hybrid_kv_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CudaPlatformBase.support_static_graph_mode", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CudaPlatformBase.num_compute_units", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "CudaPlatformBase.supported_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "CudaPlatformBase._enum", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CudaPlatformBase.device_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CudaPlatformBase.device_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CudaPlatformBase.dispatch_key", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CudaPlatformBase.ray_device_key", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CudaPlatformBase.dist_backend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CudaPlatformBase.device_control_env_var", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CudaPlatformBase.ray_noset_device_env_vars", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 65, "n_typed": 61, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 26, "n_method_overloads": 26, "n_method_params": 31, "n_attrs": 8, "n_properties": 1 }, { "kind": "attr", "name": "vllm.platforms.cuda.pynvml", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.platforms.cuda.with_nvml_context", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.platforms.cuda.CacheDType", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.platforms.cuda.NvmlCudaPlatform", "methods": [ { "kind": "function", "name": "NvmlCudaPlatform.get_device_capability", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NvmlCudaPlatform.has_device_capability", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "NvmlCudaPlatform.get_device_name", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NvmlCudaPlatform.get_device_uuid", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NvmlCudaPlatform.get_device_total_memory", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NvmlCudaPlatform.is_fully_connected", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NvmlCudaPlatform._get_physical_device_name", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NvmlCudaPlatform.log_warnings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 16, "n_typed": 15, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 8, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.platforms.cuda.VllmConfig", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.platforms.cuda.NonNvmlCudaPlatform", "methods": [ { "kind": "function", "name": "NonNvmlCudaPlatform.get_device_capability", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NonNvmlCudaPlatform.get_device_name", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NonNvmlCudaPlatform.get_device_total_memory", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NonNvmlCudaPlatform.is_fully_connected", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 8, "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.platforms.cuda.CudaPlatform", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.platforms.cuda.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.platforms.cuda", "names": [ "vllm.platforms.cuda.CacheDType", "vllm.platforms.cuda.CudaPlatform", "vllm.platforms.cuda.CudaPlatformBase", "vllm.platforms.cuda.NonNvmlCudaPlatform", "vllm.platforms.cuda.NvmlCudaPlatform", "vllm.platforms.cuda.VllmConfig", "vllm.platforms.cuda.logger", "vllm.platforms.cuda.nvml_available", "vllm.platforms.cuda.pynvml", "vllm.platforms.cuda.with_nvml_context" ], "n_typable": 93, "n_typed": 86, "n_any": 0, "n_untyped": 7, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 38, "n_method_overloads": 38, "n_method_params": 43, "n_classes": 3, "n_attrs": 14, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/platforms/rocm.py", "symbol_reports": [ { "kind": "function", "name": "vllm.platforms.rocm.use_rocm_custom_paged_attention", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "vllm.platforms.rocm.on_gfx942", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.platforms.rocm.on_mi3xx", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.platforms.rocm.on_gfx1x", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.platforms.rocm.flash_attn_triton_available", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.platforms.rocm.on_gfx9", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.platforms.rocm.with_amdsmi_context", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.platforms.rocm.RocmPlatform", "methods": [ { "kind": "function", "name": "RocmPlatform.import_kernels", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RocmPlatform.get_attn_backend_cls", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "RocmPlatform.get_supported_vit_attn_backends", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RocmPlatform.get_vit_attn_backend", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "RocmPlatform.set_device", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RocmPlatform.get_device_capability", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RocmPlatform.is_fully_connected", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RocmPlatform.get_device_name", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RocmPlatform.get_device_total_memory", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RocmPlatform.apply_config_platform_defaults", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RocmPlatform.check_and_update_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RocmPlatform.verify_model_arch", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RocmPlatform.verify_quantization", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RocmPlatform.get_punica_wrapper", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RocmPlatform.get_current_memory_usage", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RocmPlatform.get_device_communicator_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RocmPlatform.supports_mx", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RocmPlatform.supports_fp8", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RocmPlatform.is_fp8_fnuz", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RocmPlatform.fp8_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RocmPlatform.use_custom_allreduce", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RocmPlatform.opaque_attention_op", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RocmPlatform.is_navi", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RocmPlatform.get_static_graph_wrapper_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RocmPlatform.stateless_init_device_torch_dist_pg", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "RocmPlatform.device_count", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RocmPlatform.check_if_supports_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RocmPlatform.support_hybrid_kv_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RocmPlatform.support_static_graph_mode", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RocmPlatform.num_compute_units", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RocmPlatform._enum", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RocmPlatform.device_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "RocmPlatform.device_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "RocmPlatform.dispatch_key", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "RocmPlatform.ray_device_key", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "RocmPlatform.dist_backend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "RocmPlatform.device_control_env_var", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "RocmPlatform.ray_noset_device_env_vars", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "RocmPlatform.supported_quantization", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 61, "n_typed": 58, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 30, "n_method_overloads": 30, "n_method_params": 23, "n_attrs": 9, "n_properties": 0 }, { "kind": "attr", "name": "vllm.platforms.rocm.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.platforms.rocm.on_gfx950", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "type_ignores": [], "name": "vllm.platforms.rocm", "names": [ "vllm.platforms.rocm.RocmPlatform", "vllm.platforms.rocm.flash_attn_triton_available", "vllm.platforms.rocm.logger", "vllm.platforms.rocm.on_gfx1x", "vllm.platforms.rocm.on_gfx9", "vllm.platforms.rocm.on_gfx942", "vllm.platforms.rocm.on_gfx950", "vllm.platforms.rocm.on_mi3xx", "vllm.platforms.rocm.use_rocm_custom_paged_attention", "vllm.platforms.rocm.with_amdsmi_context" ], "n_typable": 80, "n_typed": 74, "n_any": 0, "n_untyped": 6, "n_functions": 8, "n_function_overloads": 8, "n_function_params": 10, "n_methods": 30, "n_method_overloads": 30, "n_method_params": 23, "n_classes": 1, "n_attrs": 10, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/platforms/tpu.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.platforms.tpu.USE_TPU_INFERENCE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.platforms.tpu.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [ { "kind": "type", "rules": null } ], "name": "vllm.platforms.tpu", "names": [ "vllm.platforms.tpu.USE_TPU_INFERENCE", "vllm.platforms.tpu.logger" ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 1 }, { "path": "vllm/platforms/xpu.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.platforms.xpu.VllmConfig", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.platforms.xpu.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.platforms.xpu.XPUPlatform", "methods": [ { "kind": "function", "name": "XPUPlatform.import_kernels", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "XPUPlatform.get_attn_backend_cls", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "XPUPlatform.get_supported_vit_attn_backends", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "XPUPlatform.get_vit_attn_backend", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "XPUPlatform.set_device", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "XPUPlatform.get_device_capability", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "XPUPlatform.get_device_name", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "XPUPlatform.get_punica_wrapper", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "XPUPlatform.get_device_total_memory", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "XPUPlatform.inference_mode", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "XPUPlatform.get_static_graph_wrapper_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "XPUPlatform.check_and_update_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "XPUPlatform.support_hybrid_kv_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "XPUPlatform.support_static_graph_mode", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "XPUPlatform.is_pin_memory_available", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "XPUPlatform.get_current_memory_usage", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "XPUPlatform.fp8_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "XPUPlatform.is_data_center_gpu", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "XPUPlatform.get_device_communicator_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "XPUPlatform.device_count", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "XPUPlatform.check_if_supports_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "XPUPlatform.opaque_attention_op", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "XPUPlatform.insert_blocks_to_device", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "XPUPlatform.swap_out_blocks_to_host", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "XPUPlatform.num_compute_units", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "XPUPlatform._enum", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "XPUPlatform.device_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "XPUPlatform.device_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "XPUPlatform.dispatch_key", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "XPUPlatform.ray_device_key", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "XPUPlatform.dist_backend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "XPUPlatform.device_control_env_var", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 53, "n_typed": 50, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 25, "n_method_overloads": 25, "n_method_params": 22, "n_attrs": 7, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.platforms.xpu", "names": [ "vllm.platforms.xpu.VllmConfig", "vllm.platforms.xpu.XPUPlatform", "vllm.platforms.xpu.logger" ], "n_typable": 54, "n_typed": 50, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 25, "n_method_overloads": 25, "n_method_params": 22, "n_classes": 1, "n_attrs": 9, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/plugins/__init__.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.plugins.plugins_loaded", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.plugins.IO_PROCESSOR_PLUGINS_GROUP", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.plugins.load_general_plugins", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.plugins.load_plugins_by_group", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.plugins.PLATFORM_PLUGINS_GROUP", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.plugins.DEFAULT_PLUGINS_GROUP", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.plugins.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.plugins.STAT_LOGGER_PLUGINS_GROUP", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.plugins", "names": [ "vllm.plugins.DEFAULT_PLUGINS_GROUP", "vllm.plugins.IO_PROCESSOR_PLUGINS_GROUP", "vllm.plugins.PLATFORM_PLUGINS_GROUP", "vllm.plugins.STAT_LOGGER_PLUGINS_GROUP", "vllm.plugins.load_general_plugins", "vllm.plugins.load_plugins_by_group", "vllm.plugins.logger", "vllm.plugins.plugins_loaded" ], "n_typable": 4, "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 1, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 6, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/plugins/io_processors/__init__.py", "symbol_reports": [ { "kind": "function", "name": "vllm.plugins.io_processors.get_io_processor", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.plugins.io_processors.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.plugins.io_processors", "names": [ "vllm.plugins.io_processors.get_io_processor", "vllm.plugins.io_processors.logger" ], "n_typable": 5, "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 3, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/plugins/io_processors/interface.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.plugins.io_processors.interface.IOProcessorInput", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.plugins.io_processors.interface.IOProcessor", "methods": [ { "kind": "function", "name": "IOProcessor.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "IOProcessor.parse_data", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "IOProcessor.merge_sampling_params", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "IOProcessor.merge_pooling_params", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "IOProcessor.pre_process", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "IOProcessor.pre_process_async", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "IOProcessor.post_process", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "IOProcessor.post_process_async", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "IOProcessor.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 26, "n_typed": 20, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 17, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.plugins.io_processors.interface.IOProcessorOutput", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.plugins.io_processors.interface", "names": [ "vllm.plugins.io_processors.interface.IOProcessor", "vllm.plugins.io_processors.interface.IOProcessorInput", "vllm.plugins.io_processors.interface.IOProcessorOutput" ], "n_typable": 26, "n_typed": 20, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 17, "n_classes": 1, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/plugins/lora_resolvers/filesystem_resolver.py", "symbol_reports": [ { "kind": "class", "name": "vllm.plugins.lora_resolvers.filesystem_resolver.FilesystemResolver", "methods": [ { "kind": "function", "name": "FilesystemResolver.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FilesystemResolver.resolve_lora", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FilesystemResolver._get_lora_req_from_path", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FilesystemResolver.lora_cache_dir", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 8, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.plugins.lora_resolvers.filesystem_resolver.register_filesystem_resolver", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "type_ignores": [], "name": "vllm.plugins.lora_resolvers.filesystem_resolver", "names": [ "vllm.plugins.lora_resolvers.filesystem_resolver.FilesystemResolver", "vllm.plugins.lora_resolvers.filesystem_resolver.register_filesystem_resolver" ], "n_typable": 11, "n_typed": 8, "n_any": 0, "n_untyped": 3, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/plugins/lora_resolvers/hf_hub_resolver.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.plugins.lora_resolvers.hf_hub_resolver.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.plugins.lora_resolvers.hf_hub_resolver.register_hf_hub_resolver", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "class", "name": "vllm.plugins.lora_resolvers.hf_hub_resolver.HfHubResolver", "methods": [ { "kind": "function", "name": "HfHubResolver.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HfHubResolver.resolve_lora", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "HfHubResolver._resolve_repo", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HfHubResolver._resolve_repo_subpath", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "HfHubResolver._get_adapter_dirs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "HfHubResolver.repo_list", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "HfHubResolver.adapter_dirs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 14, "n_typed": 13, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 7, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.plugins.lora_resolvers.hf_hub_resolver", "names": [ "vllm.plugins.lora_resolvers.hf_hub_resolver.HfHubResolver", "vllm.plugins.lora_resolvers.hf_hub_resolver.logger", "vllm.plugins.lora_resolvers.hf_hub_resolver.register_hf_hub_resolver" ], "n_typable": 16, "n_typed": 13, "n_any": 0, "n_untyped": 3, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 7, "n_classes": 1, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/profiler/layerwise_profile.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.profiler.layerwise_profile.StatsEntry", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.profiler.layerwise_profile.LayerwiseProfileResults", "methods": [ { "kind": "function", "name": "LayerwiseProfileResults.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LayerwiseProfileResults.print_model_table", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LayerwiseProfileResults.print_summary_table", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LayerwiseProfileResults.export_model_stats_table_csv", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LayerwiseProfileResults.export_summary_stats_table_csv", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LayerwiseProfileResults.convert_stats_to_dict", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LayerwiseProfileResults._indent_row_names_based_on_depth", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LayerwiseProfileResults._build_correlation_map", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LayerwiseProfileResults._build_module_tree", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LayerwiseProfileResults._get_kineto_gpu_event", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LayerwiseProfileResults._cumulative_cuda_time", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LayerwiseProfileResults._total_cuda_time", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LayerwiseProfileResults._build_stats_trees", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LayerwiseProfileResults._flatten_stats_tree", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LayerwiseProfileResults._convert_stats_tree_to_dict", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LayerwiseProfileResults._kineto_results", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LayerwiseProfileResults._kineto_event_correlation_map", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LayerwiseProfileResults._event_correlation_map", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LayerwiseProfileResults._module_tree", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LayerwiseProfileResults._model_stats_tree", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LayerwiseProfileResults._summary_stats_tree", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LayerwiseProfileResults.num_running_seqs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 25, "n_typed": 13, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 10, "n_attrs": 7, "n_properties": 0 }, { "kind": "attr", "name": "vllm.profiler.layerwise_profile.StatsEntryT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.profiler.layerwise_profile.pd", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.profiler.layerwise_profile.SummaryStatsEntry", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "SummaryStatsEntry.name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SummaryStatsEntry.cuda_time_us", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SummaryStatsEntry.pct_cuda_time", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SummaryStatsEntry.invocations", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.profiler.layerwise_profile.ModelStatsEntry", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ModelStatsEntry.name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ModelStatsEntry.cpu_time_us", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ModelStatsEntry.cuda_time_us", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ModelStatsEntry.pct_cuda_time", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ModelStatsEntry.trace", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.profiler.layerwise_profile.layerwise_profile", "methods": [ { "kind": "function", "name": "layerwise_profile.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "layerwise_profile.__enter__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "layerwise_profile.__exit__", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "layerwise_profile.num_running_seqs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 1, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.profiler.layerwise_profile", "names": [ "vllm.profiler.layerwise_profile.LayerwiseProfileResults", "vllm.profiler.layerwise_profile.ModelStatsEntry", "vllm.profiler.layerwise_profile.StatsEntry", "vllm.profiler.layerwise_profile.StatsEntryT", "vllm.profiler.layerwise_profile.SummaryStatsEntry", "vllm.profiler.layerwise_profile.layerwise_profile", "vllm.profiler.layerwise_profile.pd" ], "n_typable": 35, "n_typed": 15, "n_any": 0, "n_untyped": 20, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 18, "n_method_overloads": 18, "n_method_params": 14, "n_classes": 4, "n_attrs": 20, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/profiler/utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.profiler.utils.event_has_module", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.profiler.utils.TablePrinter", "methods": [ { "kind": "function", "name": "TablePrinter.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TablePrinter.print_table", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TablePrinter._print_header", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TablePrinter._print_row", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TablePrinter._print_line", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TablePrinter.row_cls", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TablePrinter.fieldnames", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TablePrinter.column_widths", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 3, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 4, "n_attrs": 3, "n_properties": 0 }, { "kind": "function", "name": "vllm.profiler.utils.event_module_repr", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.profiler.utils.trim_string_front", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.profiler.utils.event_torch_op_stack_trace", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.profiler.utils.event_is_torch_op", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.profiler.utils.event_arg_repr", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.profiler.utils.event_torch_op_repr", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.profiler.utils.indent_string", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.profiler.utils.trim_string_back", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.profiler.utils", "names": [ "vllm.profiler.utils.TablePrinter", "vllm.profiler.utils.event_arg_repr", "vllm.profiler.utils.event_has_module", "vllm.profiler.utils.event_is_torch_op", "vllm.profiler.utils.event_module_repr", "vllm.profiler.utils.event_torch_op_repr", "vllm.profiler.utils.event_torch_op_stack_trace", "vllm.profiler.utils.indent_string", "vllm.profiler.utils.trim_string_back", "vllm.profiler.utils.trim_string_front" ], "n_typable": 35, "n_typed": 25, "n_any": 0, "n_untyped": 10, "n_functions": 9, "n_function_overloads": 9, "n_function_params": 14, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 4, "n_classes": 1, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/profiler/wrapper.py", "symbol_reports": [ { "kind": "class", "name": "vllm.profiler.wrapper.CudaProfilerWrapper", "methods": [ { "kind": "function", "name": "CudaProfilerWrapper.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CudaProfilerWrapper._start", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CudaProfilerWrapper._stop", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CudaProfilerWrapper.annotate_context_manager", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.profiler.wrapper.WorkerProfiler", "methods": [ { "kind": "function", "name": "WorkerProfiler.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WorkerProfiler._start", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "WorkerProfiler._stop", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "WorkerProfiler._call_start", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "WorkerProfiler._call_stop", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "WorkerProfiler.start", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "WorkerProfiler.step", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "WorkerProfiler.stop", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "WorkerProfiler.shutdown", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "WorkerProfiler.annotate_context_manager", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 11, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.profiler.wrapper.TorchProfilerActivity", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.profiler.wrapper.TorchProfilerActivityMap", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.profiler.wrapper.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.profiler.wrapper.TorchProfilerWrapper", "methods": [ { "kind": "function", "name": "TorchProfilerWrapper.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "TorchProfilerWrapper._start", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TorchProfilerWrapper._stop", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TorchProfilerWrapper.annotate_context_manager", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TorchProfilerWrapper.local_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TorchProfilerWrapper.profiler_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TorchProfilerWrapper.dump_cpu_time_total", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TorchProfilerWrapper.profiler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 9, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 6, "n_attrs": 4, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.profiler.wrapper", "names": [ "vllm.profiler.wrapper.CudaProfilerWrapper", "vllm.profiler.wrapper.TorchProfilerActivity", "vllm.profiler.wrapper.TorchProfilerActivityMap", "vllm.profiler.wrapper.TorchProfilerWrapper", "vllm.profiler.wrapper.WorkerProfiler", "vllm.profiler.wrapper.logger" ], "n_typable": 34, "n_typed": 26, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 18, "n_method_overloads": 18, "n_method_params": 10, "n_classes": 3, "n_attrs": 7, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/ray/lazy_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.ray.lazy_utils.is_ray_initialized", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.ray.lazy_utils.is_in_ray_actor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "type_ignores": [], "name": "vllm.ray.lazy_utils", "names": [ "vllm.ray.lazy_utils.is_in_ray_actor", "vllm.ray.lazy_utils.is_ray_initialized" ], "n_typable": 2, "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/ray/ray_env.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.ray.ray_env.RAY_NON_CARRY_OVER_ENV_VARS", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.ray.ray_env.RAY_NON_CARRY_OVER_ENV_VARS_FILE", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.ray.ray_env.get_env_vars_to_copy", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.ray.ray_env.DEFAULT_ENV_VAR_PREFIXES", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.ray.ray_env.DEFAULT_EXTRA_ENV_VARS", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.ray.ray_env.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.ray.ray_env", "names": [ "vllm.ray.ray_env.DEFAULT_ENV_VAR_PREFIXES", "vllm.ray.ray_env.DEFAULT_EXTRA_ENV_VARS", "vllm.ray.ray_env.RAY_NON_CARRY_OVER_ENV_VARS", "vllm.ray.ray_env.RAY_NON_CARRY_OVER_ENV_VARS_FILE", "vllm.ray.ray_env.get_env_vars_to_copy", "vllm.ray.ray_env.logger" ], "n_typable": 9, "n_typed": 6, "n_any": 0, "n_untyped": 3, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 3, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 5, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/reasoning/abs_reasoning_parsers.py", "symbol_reports": [ { "kind": "class", "name": "vllm.reasoning.abs_reasoning_parsers.ReasoningParserManager", "methods": [ { "kind": "function", "name": "ReasoningParserManager.get_reasoning_parser", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ReasoningParserManager.list_registered", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ReasoningParserManager._load_lazy_parser", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ReasoningParserManager._register_module", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ReasoningParserManager.register_lazy_module", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ReasoningParserManager.register_module", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ReasoningParserManager.import_reasoning_parser", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ReasoningParserManager.reasoning_parsers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ReasoningParserManager.lazy_parsers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 21, "n_typed": 21, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 12, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.reasoning.abs_reasoning_parsers.ReasoningParser", "methods": [ { "kind": "function", "name": "ReasoningParser.__init__", "n_typed": 0, "n_any": 1, "n_untyped": 3, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ReasoningParser.is_reasoning_end", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ReasoningParser.is_reasoning_end_streaming", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ReasoningParser.extract_content_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ReasoningParser.count_reasoning_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ReasoningParser.extract_reasoning", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ReasoningParser.extract_reasoning_streaming", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "ReasoningParser.prepare_structured_tag", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [ { "kind": "property", "name": "ReasoningParser.vocab", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "ReasoningParser.model_tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 28, "n_typed": 23, "n_any": 1, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 18, "n_attrs": 1, "n_properties": 1 }, { "kind": "attr", "name": "vllm.reasoning.abs_reasoning_parsers.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.reasoning.abs_reasoning_parsers", "names": [ "vllm.reasoning.abs_reasoning_parsers.ReasoningParser", "vllm.reasoning.abs_reasoning_parsers.ReasoningParserManager", "vllm.reasoning.abs_reasoning_parsers.logger" ], "n_typable": 50, "n_typed": 44, "n_any": 1, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 30, "n_classes": 2, "n_attrs": 4, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/reasoning/basic_parsers.py", "symbol_reports": [ { "kind": "class", "name": "vllm.reasoning.basic_parsers.BaseThinkingReasoningParser", "methods": [ { "kind": "function", "name": "BaseThinkingReasoningParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BaseThinkingReasoningParser.is_reasoning_end", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseThinkingReasoningParser.is_reasoning_end_streaming", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseThinkingReasoningParser.extract_content_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseThinkingReasoningParser.extract_reasoning_streaming", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "BaseThinkingReasoningParser.extract_reasoning", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseThinkingReasoningParser.count_reasoning_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "BaseThinkingReasoningParser.start_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "BaseThinkingReasoningParser.end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "BaseThinkingReasoningParser.start_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseThinkingReasoningParser.end_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 27, "n_typed": 22, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 16, "n_attrs": 2, "n_properties": 2 } ], "type_ignores": [], "name": "vllm.reasoning.basic_parsers", "names": [ "vllm.reasoning.basic_parsers.BaseThinkingReasoningParser" ], "n_typable": 27, "n_typed": 22, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 16, "n_classes": 1, "n_attrs": 2, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/reasoning/deepseek_r1_reasoning_parser.py", "symbol_reports": [ { "kind": "class", "name": "vllm.reasoning.deepseek_r1_reasoning_parser.DeepSeekR1ReasoningParser", "methods": [ { "kind": "function", "name": "DeepSeekR1ReasoningParser.extract_reasoning_streaming", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [ { "kind": "property", "name": "DeepSeekR1ReasoningParser.start_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "DeepSeekR1ReasoningParser.end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [], "n_typable": 9, "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 6, "n_attrs": 0, "n_properties": 2 } ], "type_ignores": [], "name": "vllm.reasoning.deepseek_r1_reasoning_parser", "names": [ "vllm.reasoning.deepseek_r1_reasoning_parser.DeepSeekR1ReasoningParser" ], "n_typable": 9, "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 6, "n_classes": 1, "n_attrs": 0, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/reasoning/deepseek_v3_reasoning_parser.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.reasoning.deepseek_v3_reasoning_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.reasoning.deepseek_v3_reasoning_parser.DeepSeekV3ReasoningWithThinkingParser", "methods": [ { "kind": "function", "name": "DeepSeekV3ReasoningWithThinkingParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.reasoning.deepseek_v3_reasoning_parser.DeepSeekV3ReasoningParser", "methods": [ { "kind": "function", "name": "DeepSeekV3ReasoningParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DeepSeekV3ReasoningParser.is_reasoning_end", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepSeekV3ReasoningParser.is_reasoning_end_streaming", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeepSeekV3ReasoningParser.extract_content_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepSeekV3ReasoningParser.extract_reasoning", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeepSeekV3ReasoningParser.extract_reasoning_streaming", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [], "n_typable": 21, "n_typed": 18, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 15, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.reasoning.deepseek_v3_reasoning_parser", "names": [ "vllm.reasoning.deepseek_v3_reasoning_parser.DeepSeekV3ReasoningParser", "vllm.reasoning.deepseek_v3_reasoning_parser.DeepSeekV3ReasoningWithThinkingParser", "vllm.reasoning.deepseek_v3_reasoning_parser.logger" ], "n_typable": 26, "n_typed": 19, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 18, "n_classes": 2, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/reasoning/ernie45_reasoning_parser.py", "symbol_reports": [ { "kind": "class", "name": "vllm.reasoning.ernie45_reasoning_parser.Ernie45ReasoningParser", "methods": [ { "kind": "function", "name": "Ernie45ReasoningParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Ernie45ReasoningParser.extract_reasoning_streaming", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Ernie45ReasoningParser.extract_reasoning", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [ { "kind": "property", "name": "Ernie45ReasoningParser.start_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Ernie45ReasoningParser.end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "Ernie45ReasoningParser.response_start_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Ernie45ReasoningParser.response_end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Ernie45ReasoningParser.newline_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Ernie45ReasoningParser.start_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie45ReasoningParser.end_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie45ReasoningParser.response_start_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie45ReasoningParser.response_end_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie45ReasoningParser.newline_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie45ReasoningParser.parser_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 25, "n_typed": 16, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 11, "n_attrs": 9, "n_properties": 2 }, { "kind": "attr", "name": "vllm.reasoning.ernie45_reasoning_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.reasoning.ernie45_reasoning_parser", "names": [ "vllm.reasoning.ernie45_reasoning_parser.Ernie45ReasoningParser", "vllm.reasoning.ernie45_reasoning_parser.logger" ], "n_typable": 26, "n_typed": 16, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 11, "n_classes": 1, "n_attrs": 10, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/reasoning/gptoss_reasoning_parser.py", "symbol_reports": [ { "kind": "function", "name": "vllm.reasoning.gptoss_reasoning_parser.from_builtin_tool_to_tag", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.reasoning.gptoss_reasoning_parser.tag_with_builtin_funcs", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.reasoning.gptoss_reasoning_parser.no_func_reaonsing_tag", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.reasoning.gptoss_reasoning_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.reasoning.gptoss_reasoning_parser.GptOssReasoningParser", "methods": [ { "kind": "function", "name": "GptOssReasoningParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GptOssReasoningParser.is_reasoning_end", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GptOssReasoningParser.extract_content_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GptOssReasoningParser.extract_reasoning_streaming", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "GptOssReasoningParser.extract_reasoning", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GptOssReasoningParser.prepare_structured_tag", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GptOssReasoningParser.reasoning_end_token_ids_prefix", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GptOssReasoningParser.reasoning_end_token_ids_suffix", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GptOssReasoningParser.eom_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GptOssReasoningParser.reasoning_max_num_between_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 25, "n_typed": 18, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 15, "n_attrs": 4, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.reasoning.gptoss_reasoning_parser", "names": [ "vllm.reasoning.gptoss_reasoning_parser.GptOssReasoningParser", "vllm.reasoning.gptoss_reasoning_parser.from_builtin_tool_to_tag", "vllm.reasoning.gptoss_reasoning_parser.logger", "vllm.reasoning.gptoss_reasoning_parser.no_func_reaonsing_tag", "vllm.reasoning.gptoss_reasoning_parser.tag_with_builtin_funcs" ], "n_typable": 31, "n_typed": 22, "n_any": 0, "n_untyped": 9, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 3, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 15, "n_classes": 1, "n_attrs": 6, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/reasoning/granite_reasoning_parser.py", "symbol_reports": [ { "kind": "class", "name": "vllm.reasoning.granite_reasoning_parser.GraniteReasoningParser", "methods": [ { "kind": "function", "name": "GraniteReasoningParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GraniteReasoningParser.extract_reasoning", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GraniteReasoningParser.extract_reasoning_streaming", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "GraniteReasoningParser._is_reasoning_start_substr", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GraniteReasoningParser._is_response_start_substr", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GraniteReasoningParser._get_delta_message_with_no_reasoning_bounds", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GraniteReasoningParser._get_delta_message_with_no_response_bounds", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GraniteReasoningParser._get_delta_message_with_both_bounds", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "GraniteReasoningParser._get_content_sections", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GraniteReasoningParser.think_start_expr", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteReasoningParser.response_start_expr", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteReasoningParser.reasoning_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteReasoningParser.valid_think_starts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteReasoningParser.valid_response_starts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteReasoningParser.seq_boundary_end", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteReasoningParser.seq_boundary_start", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteReasoningParser.longest_think_start", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 41, "n_typed": 30, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 24, "n_attrs": 8, "n_properties": 0 }, { "kind": "attr", "name": "vllm.reasoning.granite_reasoning_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.reasoning.granite_reasoning_parser", "names": [ "vllm.reasoning.granite_reasoning_parser.GraniteReasoningParser", "vllm.reasoning.granite_reasoning_parser.logger" ], "n_typable": 42, "n_typed": 30, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 24, "n_classes": 1, "n_attrs": 9, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/reasoning/hunyuan_a13b_reasoning_parser.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.reasoning.hunyuan_a13b_reasoning_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.reasoning.hunyuan_a13b_reasoning_parser.HunyuanA13BReasoningParser", "methods": [ { "kind": "function", "name": "HunyuanA13BReasoningParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "HunyuanA13BReasoningParser.is_reasoning_end", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HunyuanA13BReasoningParser.extract_content_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HunyuanA13BReasoningParser.extract_reasoning", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "HunyuanA13BReasoningParser._is_strict_increasing_subsequence", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "HunyuanA13BReasoningParser.extract_reasoning_streaming", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "HunyuanA13BReasoningParser.think_start_expr", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunyuanA13BReasoningParser.think_end_expr", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunyuanA13BReasoningParser.response_start_expr", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunyuanA13BReasoningParser.response_end_expr", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunyuanA13BReasoningParser.full_match_reasoning_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunyuanA13BReasoningParser.half_match_reasoning_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunyuanA13BReasoningParser.think_start_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunyuanA13BReasoningParser.think_start_ids_fast", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunyuanA13BReasoningParser.response_start_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunyuanA13BReasoningParser.response_start_ids_fast", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunyuanA13BReasoningParser.response_end_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunyuanA13BReasoningParser.fast_think_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunyuanA13BReasoningParser.buffered_text", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunyuanA13BReasoningParser.buffered_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunyuanA13BReasoningParser.current_state", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunyuanA13BReasoningParser.all_states", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunyuanA13BReasoningParser.expected_sequence", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunyuanA13BReasoningParser.expected_sequence_side", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunyuanA13BReasoningParser.sequence_index", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunyuanA13BReasoningParser.token_buffer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunyuanA13BReasoningParser.text_buffer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 42, "n_typed": 18, "n_any": 0, "n_untyped": 24, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 15, "n_attrs": 21, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.reasoning.hunyuan_a13b_reasoning_parser", "names": [ "vllm.reasoning.hunyuan_a13b_reasoning_parser.HunyuanA13BReasoningParser", "vllm.reasoning.hunyuan_a13b_reasoning_parser.logger" ], "n_typable": 43, "n_typed": 18, "n_any": 0, "n_untyped": 25, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 15, "n_classes": 1, "n_attrs": 22, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/reasoning/identity_reasoning_parser.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.reasoning.identity_reasoning_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.reasoning.identity_reasoning_parser.IdentityReasoningParser", "methods": [ { "kind": "function", "name": "IdentityReasoningParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "IdentityReasoningParser.is_reasoning_end", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "IdentityReasoningParser.is_reasoning_end_streaming", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "IdentityReasoningParser.extract_content_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "IdentityReasoningParser.extract_reasoning_streaming", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "IdentityReasoningParser.extract_reasoning", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 21, "n_typed": 18, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 15, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.reasoning.identity_reasoning_parser", "names": [ "vllm.reasoning.identity_reasoning_parser.IdentityReasoningParser", "vllm.reasoning.identity_reasoning_parser.logger" ], "n_typable": 22, "n_typed": 18, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 15, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/reasoning/kimi_k2_reasoning_parser.py", "symbol_reports": [ { "kind": "class", "name": "vllm.reasoning.kimi_k2_reasoning_parser.KimiK2ReasoningParser", "methods": [ { "kind": "function", "name": "KimiK2ReasoningParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "KimiK2ReasoningParser._is_identity_mode", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KimiK2ReasoningParser.is_reasoning_end", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KimiK2ReasoningParser.is_reasoning_end_streaming", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "KimiK2ReasoningParser.extract_content_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KimiK2ReasoningParser.extract_reasoning", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "KimiK2ReasoningParser.extract_reasoning_streaming", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [], "n_typable": 22, "n_typed": 19, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 15, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.reasoning.kimi_k2_reasoning_parser", "names": [ "vllm.reasoning.kimi_k2_reasoning_parser.KimiK2ReasoningParser" ], "n_typable": 22, "n_typed": 19, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 15, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/reasoning/minimax_m2_reasoning_parser.py", "symbol_reports": [ { "kind": "class", "name": "vllm.reasoning.minimax_m2_reasoning_parser.MiniMaxM2ReasoningParser", "methods": [ { "kind": "function", "name": "MiniMaxM2ReasoningParser.extract_reasoning_streaming", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [ { "kind": "property", "name": "MiniMaxM2ReasoningParser.start_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "MiniMaxM2ReasoningParser.end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [], "n_typable": 9, "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 6, "n_attrs": 0, "n_properties": 2 }, { "kind": "class", "name": "vllm.reasoning.minimax_m2_reasoning_parser.MiniMaxM2AppendThinkReasoningParser", "methods": [ { "kind": "function", "name": "MiniMaxM2AppendThinkReasoningParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MiniMaxM2AppendThinkReasoningParser.is_reasoning_end", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniMaxM2AppendThinkReasoningParser.extract_content_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MiniMaxM2AppendThinkReasoningParser.extract_reasoning_streaming", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "MiniMaxM2AppendThinkReasoningParser.extract_reasoning", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiniMaxM2AppendThinkReasoningParser.end_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiniMaxM2AppendThinkReasoningParser.start_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 15, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 13, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.reasoning.minimax_m2_reasoning_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.reasoning.minimax_m2_reasoning_parser", "names": [ "vllm.reasoning.minimax_m2_reasoning_parser.MiniMaxM2AppendThinkReasoningParser", "vllm.reasoning.minimax_m2_reasoning_parser.MiniMaxM2ReasoningParser", "vllm.reasoning.minimax_m2_reasoning_parser.logger" ], "n_typable": 30, "n_typed": 24, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 19, "n_classes": 2, "n_attrs": 3, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/reasoning/mistral_reasoning_parser.py", "symbol_reports": [ { "kind": "class", "name": "vllm.reasoning.mistral_reasoning_parser.MistralReasoningParser", "methods": [ { "kind": "function", "name": "MistralReasoningParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MistralReasoningParser.is_reasoning_end", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MistralReasoningParser.extract_content_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MistralReasoningParser.extract_reasoning", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [ { "kind": "property", "name": "MistralReasoningParser.start_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "MistralReasoningParser.end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "MistralReasoningParser.start_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MistralReasoningParser.end_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 10, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 7, "n_attrs": 2, "n_properties": 2 }, { "kind": "attr", "name": "vllm.reasoning.mistral_reasoning_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.reasoning.mistral_reasoning_parser", "names": [ "vllm.reasoning.mistral_reasoning_parser.MistralReasoningParser", "vllm.reasoning.mistral_reasoning_parser.logger" ], "n_typable": 16, "n_typed": 10, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 7, "n_classes": 1, "n_attrs": 3, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/reasoning/nemotron_v3_reasoning_parser.py", "symbol_reports": [ { "kind": "class", "name": "vllm.reasoning.nemotron_v3_reasoning_parser.NemotronV3ReasoningParser", "methods": [ { "kind": "function", "name": "NemotronV3ReasoningParser.extract_reasoning", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.reasoning.nemotron_v3_reasoning_parser", "names": [ "vllm.reasoning.nemotron_v3_reasoning_parser.NemotronV3ReasoningParser" ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/reasoning/olmo3_reasoning_parser.py", "symbol_reports": [ { "kind": "class", "name": "vllm.reasoning.olmo3_reasoning_parser.Indices", "methods": [ { "kind": "function", "name": "Indices.__len__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Indices.start", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Indices.end", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.reasoning.olmo3_reasoning_parser.Olmo3ReasoningBuffer", "methods": [ { "kind": "function", "name": "Olmo3ReasoningBuffer.process_buffer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Olmo3ReasoningBuffer.__len__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Olmo3ReasoningBuffer.add_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Olmo3ReasoningBuffer.think_start", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Olmo3ReasoningBuffer.think_end", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Olmo3ReasoningBuffer.buffer", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Olmo3ReasoningBuffer.state", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 4, "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 1, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.reasoning.olmo3_reasoning_parser.Olmo3ReasoningParser", "methods": [ { "kind": "function", "name": "Olmo3ReasoningParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Olmo3ReasoningParser.is_reasoning_end", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Olmo3ReasoningParser.extract_content_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Olmo3ReasoningParser.extract_reasoning", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Olmo3ReasoningParser.extract_reasoning_streaming", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Olmo3ReasoningParser.think_start", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo3ReasoningParser.think_end", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo3ReasoningParser.reasoning_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo3ReasoningParser.buffer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 15, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 13, "n_attrs": 4, "n_properties": 0 }, { "kind": "function", "name": "vllm.reasoning.olmo3_reasoning_parser.string_overlap", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.reasoning.olmo3_reasoning_parser.Olmo3ReasoningState", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Olmo3ReasoningState.REASONING", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Olmo3ReasoningState.CONTENT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.reasoning.olmo3_reasoning_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.reasoning.olmo3_reasoning_parser", "names": [ "vllm.reasoning.olmo3_reasoning_parser.Indices", "vllm.reasoning.olmo3_reasoning_parser.Olmo3ReasoningBuffer", "vllm.reasoning.olmo3_reasoning_parser.Olmo3ReasoningParser", "vllm.reasoning.olmo3_reasoning_parser.Olmo3ReasoningState", "vllm.reasoning.olmo3_reasoning_parser.logger", "vllm.reasoning.olmo3_reasoning_parser.string_overlap" ], "n_typable": 31, "n_typed": 21, "n_any": 0, "n_untyped": 10, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 14, "n_classes": 4, "n_attrs": 13, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/reasoning/qwen3_reasoning_parser.py", "symbol_reports": [ { "kind": "class", "name": "vllm.reasoning.qwen3_reasoning_parser.Qwen3ReasoningParser", "methods": [ { "kind": "function", "name": "Qwen3ReasoningParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Qwen3ReasoningParser.extract_reasoning", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3ReasoningParser.extract_reasoning_streaming", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [ { "kind": "property", "name": "Qwen3ReasoningParser.start_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Qwen3ReasoningParser.end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "Qwen3ReasoningParser.thinking_enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 13, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 11, "n_attrs": 1, "n_properties": 2 } ], "type_ignores": [], "name": "vllm.reasoning.qwen3_reasoning_parser", "names": [ "vllm.reasoning.qwen3_reasoning_parser.Qwen3ReasoningParser" ], "n_typable": 17, "n_typed": 13, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 11, "n_classes": 1, "n_attrs": 1, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/reasoning/seedoss_reasoning_parser.py", "symbol_reports": [ { "kind": "class", "name": "vllm.reasoning.seedoss_reasoning_parser.SeedOSSReasoningParser", "methods": [], "properties": [ { "kind": "property", "name": "SeedOSSReasoningParser.start_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "SeedOSSReasoningParser.end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 2 } ], "type_ignores": [], "name": "vllm.reasoning.seedoss_reasoning_parser", "names": [ "vllm.reasoning.seedoss_reasoning_parser.SeedOSSReasoningParser" ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 1, "n_attrs": 0, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/reasoning/step3_reasoning_parser.py", "symbol_reports": [ { "kind": "class", "name": "vllm.reasoning.step3_reasoning_parser.Step3ReasoningParser", "methods": [ { "kind": "function", "name": "Step3ReasoningParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Step3ReasoningParser.extract_reasoning_streaming", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Step3ReasoningParser.extract_reasoning", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Step3ReasoningParser.is_reasoning_end", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Step3ReasoningParser.is_reasoning_end_streaming", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Step3ReasoningParser.extract_content_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Step3ReasoningParser.think_end_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3ReasoningParser.reasoning_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3ReasoningParser.think_end_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 24, "n_typed": 18, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 15, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.reasoning.step3_reasoning_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.reasoning.step3_reasoning_parser", "names": [ "vllm.reasoning.step3_reasoning_parser.Step3ReasoningParser", "vllm.reasoning.step3_reasoning_parser.logger" ], "n_typable": 25, "n_typed": 18, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 15, "n_classes": 1, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/reasoning/step3p5_reasoning_parser.py", "symbol_reports": [ { "kind": "class", "name": "vllm.reasoning.step3p5_reasoning_parser.Step3p5ReasoningParser", "methods": [ { "kind": "function", "name": "Step3p5ReasoningParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Step3p5ReasoningParser.is_reasoning_end", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Step3p5ReasoningParser.is_reasoning_end_streaming", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Step3p5ReasoningParser._is_reasoning_end_from_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Step3p5ReasoningParser.extract_reasoning", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Step3p5ReasoningParser.extract_reasoning_streaming", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [ { "kind": "property", "name": "Step3p5ReasoningParser.start_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Step3p5ReasoningParser.end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [], "n_typable": 23, "n_typed": 20, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 15, "n_attrs": 0, "n_properties": 2 } ], "type_ignores": [], "name": "vllm.reasoning.step3p5_reasoning_parser", "names": [ "vllm.reasoning.step3p5_reasoning_parser.Step3p5ReasoningParser" ], "n_typable": 23, "n_typed": 20, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 15, "n_classes": 1, "n_attrs": 0, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/renderers/params.py", "symbol_reports": [ { "kind": "function", "name": "vllm.renderers.params.merge_kwargs", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.renderers.params.ChatParams", "methods": [ { "kind": "function", "name": "ChatParams.with_defaults", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ChatParams.get_apply_chat_template_kwargs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ChatParams.chat_template", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ChatParams.chat_template_content_format", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ChatParams.chat_template_kwargs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.renderers.params.TokenizeParams", "methods": [ { "kind": "function", "name": "TokenizeParams.__post_init__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TokenizeParams.with_kwargs", "n_typed": 0, "n_any": 1, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TokenizeParams.get_encode_kwargs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TokenizeParams._text_len_check", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TokenizeParams._text_lowercase", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TokenizeParams._validate_text", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TokenizeParams.apply_pre_tokenization", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TokenizeParams._token_padding", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TokenizeParams._token_truncation", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TokenizeParams._token_len_check", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TokenizeParams._validate_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TokenizeParams.apply_post_tokenization", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [ { "kind": "property", "name": "TokenizeParams.max_input_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "TokenizeParams.max_total_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TokenizeParams.max_output_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TokenizeParams.pad_prompt_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TokenizeParams.truncate_prompt_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TokenizeParams.do_lower_case", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TokenizeParams.add_special_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TokenizeParams.needs_detokenization", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TokenizeParams.max_total_tokens_param", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TokenizeParams.max_output_tokens_param", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TokenizeParams.truncate_prompt_tokens_param", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 32, "n_typed": 30, "n_any": 1, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 19, "n_attrs": 10, "n_properties": 1 }, { "kind": "attr", "name": "vllm.renderers.params.torch", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.renderers.params.ChatTemplateContentFormatOption", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.renderers.params.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.renderers.params", "names": [ "vllm.renderers.params.ChatParams", "vllm.renderers.params.ChatTemplateContentFormatOption", "vllm.renderers.params.TokenizeParams", "vllm.renderers.params.logger", "vllm.renderers.params.merge_kwargs", "vllm.renderers.params.torch" ], "n_typable": 41, "n_typed": 36, "n_any": 1, "n_untyped": 4, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 3, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 20, "n_classes": 2, "n_attrs": 16, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/renderers/registry.py", "symbol_reports": [ { "kind": "function", "name": "vllm.renderers.registry.renderer_from_config", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.renderers.registry.RendererRegistry", "methods": [ { "kind": "function", "name": "RendererRegistry.register", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "RendererRegistry.load_renderer_cls", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RendererRegistry.load_renderer", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RendererRegistry.renderers", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 10, "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.renderers.registry.RENDERER_REGISTRY", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.renderers.registry.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.renderers.registry", "names": [ "vllm.renderers.registry.RENDERER_REGISTRY", "vllm.renderers.registry.RendererRegistry", "vllm.renderers.registry.logger", "vllm.renderers.registry.renderer_from_config" ], "n_typable": 15, "n_typed": 11, "n_any": 0, "n_untyped": 4, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_classes": 1, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/renderers/base.py", "symbol_reports": [ { "kind": "class", "name": "vllm.renderers.base.BaseRenderer", "methods": [ { "kind": "function", "name": "BaseRenderer.from_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseRenderer.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseRenderer.get_tokenizer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BaseRenderer.get_async_tokenizer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BaseRenderer.get_mm_processor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BaseRenderer.stat_mm_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BaseRenderer.update_mm_cache_stats", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BaseRenderer.clear_mm_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BaseRenderer.shutdown", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BaseRenderer.get_bos_token_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BaseRenderer.get_eos_token_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BaseRenderer.get_dec_start_token_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BaseRenderer.render_prompt", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseRenderer.render_prompts", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseRenderer.render_prompts_async", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseRenderer.render_messages", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseRenderer.render_messages_async", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseRenderer._tokenize_prompt", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseRenderer._tokenize_prompt_async", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseRenderer._detokenize_prompt", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseRenderer._detokenize_prompt_async", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseRenderer._tokenize_singleton_prompt", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 3, "n_params": 2, "n_function_overloads": 2, "n_function_params": 2 }, { "kind": "function", "name": "BaseRenderer._tokenize_singleton_prompt_async", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 3, "n_params": 2, "n_function_overloads": 2, "n_function_params": 2 }, { "kind": "function", "name": "BaseRenderer._tokenize_enc_dec_prompt", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseRenderer._tokenize_enc_dec_prompt_async", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseRenderer.tokenize_prompt", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseRenderer.tokenize_prompts", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseRenderer.tokenize_prompt_async", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseRenderer.tokenize_prompts_async", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseRenderer._apply_prompt_extras", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseRenderer._validate_mm_uuids", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BaseRenderer._process_mm_uuids", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BaseRenderer._process_multimodal", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "BaseRenderer._process_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseRenderer._process_embeds", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseRenderer._process_singleton", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseRenderer._process_enc_dec", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseRenderer.process_for_engine", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseRenderer.render_cmpl", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BaseRenderer.render_cmpl_async", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BaseRenderer.render_chat", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BaseRenderer.render_chat_async", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [ { "kind": "property", "name": "BaseRenderer.mm_processor_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "BaseRenderer.default_cmpl_tok_params", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "BaseRenderer.default_chat_tok_params", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "BaseRenderer.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseRenderer.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseRenderer.tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseRenderer.mm_processor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 116, "n_typed": 107, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 42, "n_method_overloads": 44, "n_method_params": 67, "n_attrs": 4, "n_properties": 3 }, { "kind": "attr", "name": "vllm.renderers.base.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.renderers.base", "names": [ "vllm.renderers.base.BaseRenderer", "vllm.renderers.base.logger" ], "n_typable": 117, "n_typed": 107, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 42, "n_method_overloads": 44, "n_method_params": 67, "n_classes": 1, "n_attrs": 5, "n_properties": 3, "n_type_ignores": 0 }, { "path": "vllm/renderers/deepseek_v32.py", "symbol_reports": [ { "kind": "class", "name": "vllm.renderers.deepseek_v32.DeepseekV32Renderer", "methods": [ { "kind": "function", "name": "DeepseekV32Renderer.from_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeepseekV32Renderer.render_messages", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeepseekV32Renderer.render_messages_async", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.renderers.deepseek_v32.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.renderers.deepseek_v32", "names": [ "vllm.renderers.deepseek_v32.DeepseekV32Renderer", "vllm.renderers.deepseek_v32.logger" ], "n_typable": 10, "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/renderers/embed_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.renderers.embed_utils.safe_load_prompt_embeds", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.renderers.embed_utils", "names": [ "vllm.renderers.embed_utils.safe_load_prompt_embeds" ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/renderers/grok2.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.renderers.grok2.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.renderers.grok2.Grok2Renderer", "methods": [ { "kind": "function", "name": "Grok2Renderer.from_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Grok2Renderer.render_messages", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Grok2Renderer.render_messages_async", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.renderers.grok2", "names": [ "vllm.renderers.grok2.Grok2Renderer", "vllm.renderers.grok2.logger" ], "n_typable": 10, "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/renderers/hf.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.renderers.hf.MultiModalUUIDDict", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.renderers.hf.resolve_chat_template_kwargs", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.renderers.hf.replace_vision_chunk_video_placeholder", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.renderers.hf.resolve_chat_template", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.renderers.hf.AssistantTracker", "methods": [ { "kind": "function", "name": "AssistantTracker.parse", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AssistantTracker.tags", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.renderers.hf.HfRenderer", "methods": [ { "kind": "function", "name": "HfRenderer.from_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "HfRenderer.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "HfRenderer.render_messages", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "HfRenderer.render_messages_async", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "HfRenderer.use_unified_vision_chunk", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 12, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.renderers.hf.safe_apply_chat_template", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "vllm.renderers.hf.resolve_chat_template_content_format", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "attr", "name": "vllm.renderers.hf.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.renderers.hf.build_video_prompts_from_mm_data", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.renderers.hf.rebuild_mm_uuids_from_mm_data", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.renderers.hf.MultiModalDataDict", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.renderers.hf", "names": [ "vllm.renderers.hf.AssistantTracker", "vllm.renderers.hf.HfRenderer", "vllm.renderers.hf.MultiModalDataDict", "vllm.renderers.hf.MultiModalUUIDDict", "vllm.renderers.hf.build_video_prompts_from_mm_data", "vllm.renderers.hf.logger", "vllm.renderers.hf.rebuild_mm_uuids_from_mm_data", "vllm.renderers.hf.replace_vision_chunk_video_placeholder", "vllm.renderers.hf.resolve_chat_template", "vllm.renderers.hf.resolve_chat_template_content_format", "vllm.renderers.hf.resolve_chat_template_kwargs", "vllm.renderers.hf.safe_apply_chat_template" ], "n_typable": 49, "n_typed": 46, "n_any": 0, "n_untyped": 3, "n_functions": 7, "n_function_overloads": 7, "n_function_params": 26, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_classes": 2, "n_attrs": 5, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/renderers/inputs/preprocess.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.renderers.inputs.preprocess.EncoderDictPrompt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.renderers.inputs.preprocess.EncoderDecoderDictPrompt", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "EncoderDecoderDictPrompt.encoder_prompt", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EncoderDecoderDictPrompt.decoder_prompt", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.renderers.inputs.preprocess.DecoderDictPrompt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.renderers.inputs.preprocess.DecoderOnlyDictPrompt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.renderers.inputs.preprocess.SingletonDictPrompt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.renderers.inputs.preprocess.DictPrompt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.renderers.inputs.preprocess.parse_model_prompt", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.renderers.inputs.preprocess.prompt_to_seq", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 3, "n_typable": 2, "n_params": 1, "n_function_overloads": 3, "n_function_params": 1 }, { "kind": "function", "name": "vllm.renderers.inputs.preprocess.conversation_to_seq", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.renderers.inputs.preprocess.parse_enc_dec_prompt", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.renderers.inputs.preprocess.extract_target_prompt", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.renderers.inputs.preprocess.parse_dec_only_prompt", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.renderers.inputs.preprocess.extract_prompt_len", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.renderers.inputs.preprocess.PromptComponents", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "PromptComponents.text", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PromptComponents.token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PromptComponents.embeds", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "function", "name": "vllm.renderers.inputs.preprocess.extract_prompt_components", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.renderers.inputs.preprocess", "names": [ "vllm.renderers.inputs.preprocess.DecoderDictPrompt", "vllm.renderers.inputs.preprocess.DecoderOnlyDictPrompt", "vllm.renderers.inputs.preprocess.DictPrompt", "vllm.renderers.inputs.preprocess.EncoderDecoderDictPrompt", "vllm.renderers.inputs.preprocess.EncoderDictPrompt", "vllm.renderers.inputs.preprocess.PromptComponents", "vllm.renderers.inputs.preprocess.SingletonDictPrompt", "vllm.renderers.inputs.preprocess.conversation_to_seq", "vllm.renderers.inputs.preprocess.extract_prompt_components", "vllm.renderers.inputs.preprocess.extract_prompt_len", "vllm.renderers.inputs.preprocess.extract_target_prompt", "vllm.renderers.inputs.preprocess.parse_dec_only_prompt", "vllm.renderers.inputs.preprocess.parse_enc_dec_prompt", "vllm.renderers.inputs.preprocess.parse_model_prompt", "vllm.renderers.inputs.preprocess.prompt_to_seq" ], "n_typable": 25, "n_typed": 22, "n_any": 0, "n_untyped": 3, "n_functions": 8, "n_function_overloads": 10, "n_function_params": 12, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 2, "n_attrs": 10, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/renderers/inputs/tokenize.py", "symbol_reports": [ { "kind": "class", "name": "vllm.renderers.inputs.tokenize.EncoderDecoderTokPrompt", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "EncoderDecoderTokPrompt.encoder_prompt", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EncoderDecoderTokPrompt.decoder_prompt", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.renderers.inputs.tokenize.TokPrompt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.renderers.inputs.tokenize.DecoderOnlyTokPrompt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.renderers.inputs.tokenize.SingletonTokPrompt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.renderers.inputs.tokenize.DecoderTokPrompt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.renderers.inputs.tokenize.EncoderTokPrompt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.renderers.inputs.tokenize", "names": [ "vllm.renderers.inputs.tokenize.DecoderOnlyTokPrompt", "vllm.renderers.inputs.tokenize.DecoderTokPrompt", "vllm.renderers.inputs.tokenize.EncoderDecoderTokPrompt", "vllm.renderers.inputs.tokenize.EncoderTokPrompt", "vllm.renderers.inputs.tokenize.SingletonTokPrompt", "vllm.renderers.inputs.tokenize.TokPrompt" ], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 1, "n_attrs": 7, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/renderers/mistral.py", "symbol_reports": [ { "kind": "function", "name": "vllm.renderers.mistral.safe_apply_chat_template", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.renderers.mistral.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.renderers.mistral.MistralRenderer", "methods": [ { "kind": "function", "name": "MistralRenderer.from_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MistralRenderer.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MistralRenderer.render_messages", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MistralRenderer.render_messages_async", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.renderers.mistral", "names": [ "vllm.renderers.mistral.MistralRenderer", "vllm.renderers.mistral.logger", "vllm.renderers.mistral.safe_apply_chat_template" ], "n_typable": 17, "n_typed": 15, "n_any": 0, "n_untyped": 2, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 3, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/renderers/qwen_vl.py", "symbol_reports": [ { "kind": "class", "name": "vllm.renderers.qwen_vl.QwenVLRenderer", "methods": [ { "kind": "function", "name": "QwenVLRenderer.from_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.renderers.qwen_vl", "names": [ "vllm.renderers.qwen_vl.QwenVLRenderer" ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/renderers/terratorch.py", "symbol_reports": [ { "kind": "class", "name": "vllm.renderers.terratorch.TerratorchRenderer", "methods": [ { "kind": "function", "name": "TerratorchRenderer.from_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TerratorchRenderer.render_messages", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TerratorchRenderer.render_messages_async", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.renderers.terratorch.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.renderers.terratorch", "names": [ "vllm.renderers.terratorch.TerratorchRenderer", "vllm.renderers.terratorch.logger" ], "n_typable": 10, "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/scalar_type.py", "symbol_reports": [ { "kind": "class", "name": "vllm.scalar_type.ScalarType", "methods": [ { "kind": "function", "name": "ScalarType._floating_point_max_int", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ScalarType._floating_point_max", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ScalarType._raw_max", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ScalarType._raw_min", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ScalarType.min", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ScalarType.max", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ScalarType.is_signed", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ScalarType.is_floating_point", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ScalarType.is_integer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ScalarType.has_bias", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ScalarType.has_infs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ScalarType.has_nans", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ScalarType.is_ieee_754", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ScalarType.__str__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ScalarType.__repr__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ScalarType.__len__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ScalarType.int_", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ScalarType.uint", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ScalarType.float_IEEE754", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ScalarType.float_", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ScalarType.from_id", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "ScalarType.id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "ScalarType.size_bits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "ScalarType.exponent", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ScalarType.mantissa", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ScalarType.signed", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ScalarType.bias", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ScalarType._finite_values_only", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ScalarType.nan_repr", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 34, "n_typed": 33, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 21, "n_method_overloads": 21, "n_method_params": 11, "n_attrs": 6, "n_properties": 2 }, { "kind": "class", "name": "vllm.scalar_type.NanRepr", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "NanRepr.NONE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NanRepr.IEEE_754", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NanRepr.EXTD_RANGE_MAX_MIN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.scalar_type.scalar_types", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "scalar_types.int4", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "scalar_types.uint4", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "scalar_types.int8", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "scalar_types.uint8", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "scalar_types.float8_e4m3fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "scalar_types.float8_e5m2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "scalar_types.float8_e8m0fnu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "scalar_types.float16_e8m7", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "scalar_types.float16_e5m10", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "scalar_types.float6_e3m2f", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "scalar_types.float6_e2m3f", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "scalar_types.float4_e2m1f", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "scalar_types.uint2b2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "scalar_types.uint3b4", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "scalar_types.uint4b8", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "scalar_types.uint8b128", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "scalar_types.bfloat16", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "scalar_types.float16", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 16, "n_typed": 0, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 18, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.scalar_type", "names": [ "vllm.scalar_type.NanRepr", "vllm.scalar_type.ScalarType", "vllm.scalar_type.scalar_types" ], "n_typable": 50, "n_typed": 33, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 21, "n_method_overloads": 21, "n_method_params": 11, "n_classes": 3, "n_attrs": 27, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/scripts.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.scripts.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.scripts.main", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "type_ignores": [], "name": "vllm.scripts", "names": [ "vllm.scripts.logger", "vllm.scripts.main" ], "n_typable": 2, "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/sequence.py", "symbol_reports": [ { "kind": "class", "name": "vllm.sequence.IntermediateTensors", "methods": [ { "kind": "function", "name": "IntermediateTensors.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "IntermediateTensors.__getitem__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "IntermediateTensors.__setitem__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "IntermediateTensors.items", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "IntermediateTensors.__len__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "IntermediateTensors.__eq__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "IntermediateTensors.__repr__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "IntermediateTensors.tensors", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "IntermediateTensors.kv_connector_output", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 13, "n_typed": 8, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 6, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.sequence", "names": [ "vllm.sequence.IntermediateTensors" ], "n_typable": 13, "n_typed": 8, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 6, "n_classes": 1, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/tasks.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.tasks.POOLING_TASKS", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.tasks.GenerationTask", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.tasks.SupportedTask", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.tasks.GENERATION_TASKS", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.tasks.PoolingTask", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.tasks", "names": [ "vllm.tasks.GENERATION_TASKS", "vllm.tasks.GenerationTask", "vllm.tasks.POOLING_TASKS", "vllm.tasks.PoolingTask", "vllm.tasks.SupportedTask" ], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 5, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/third_party/flashmla/flash_mla_interface.py", "symbol_reports": [ { "kind": "function", "name": "vllm.third_party.flashmla.flash_mla_interface.flash_attn_varlen_func", "n_typed": 13, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 }, { "kind": "function", "name": "vllm.third_party.flashmla.flash_mla_interface.get_mla_metadata", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.third_party.flashmla.flash_mla_interface.Config", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Config.b", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Config.s_q", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Config.h_q", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Config.page_block_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Config.h_k", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Config.causal", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Config.is_fp8_kvcache", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Config.topk", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Config.extra_page_block_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Config.extra_topk", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 10, "n_properties": 0 }, { "kind": "class", "name": "vllm.third_party.flashmla.flash_mla_interface.FlashMLASchedMeta", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashMLASchedMeta.have_initialized", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashMLASchedMeta.config", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashMLASchedMeta.tile_scheduler_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashMLASchedMeta.num_splits", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.flashmla.flash_mla_interface.flash_mla_sparse_fwd", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "class", "name": "vllm.third_party.flashmla.flash_mla_interface.FlashAttnVarlenFunc", "methods": [ { "kind": "function", "name": "FlashAttnVarlenFunc.forward", "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "FlashAttnVarlenFunc.backward", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 14, "n_typed": 13, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 12, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.flashmla.flash_mla_interface.flash_mla_with_kvcache", "n_typed": 17, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 17, "n_params": 16, "n_function_overloads": 1, "n_function_params": 16 }, { "kind": "function", "name": "vllm.third_party.flashmla.flash_mla_interface.flash_attn_varlen_qkvpacked_func", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "vllm.third_party.flashmla.flash_mla_interface.flash_attn_varlen_kvpacked_func", "n_typed": 13, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 } ], "type_ignores": [], "name": "vllm.third_party.flashmla.flash_mla_interface", "names": [ "vllm.third_party.flashmla.flash_mla_interface.Config", "vllm.third_party.flashmla.flash_mla_interface.FlashAttnVarlenFunc", "vllm.third_party.flashmla.flash_mla_interface.FlashMLASchedMeta", "vllm.third_party.flashmla.flash_mla_interface.flash_attn_varlen_func", "vllm.third_party.flashmla.flash_mla_interface.flash_attn_varlen_kvpacked_func", "vllm.third_party.flashmla.flash_mla_interface.flash_attn_varlen_qkvpacked_func", "vllm.third_party.flashmla.flash_mla_interface.flash_mla_sparse_fwd", "vllm.third_party.flashmla.flash_mla_interface.flash_mla_with_kvcache", "vllm.third_party.flashmla.flash_mla_interface.get_mla_metadata" ], "n_typable": 78, "n_typed": 75, "n_any": 0, "n_untyped": 3, "n_functions": 6, "n_function_overloads": 6, "n_function_params": 58, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 12, "n_classes": 3, "n_attrs": 14, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/third_party/pynvml.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlPowerSmoothingProfile_v1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VGPU_COMPATIBILITY_LIMIT_HOST_DRIVER", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_TEMPERATURE_THRESHOLD_ACOUSTIC_MAX", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetGspFirmwareMode", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlCoolerInfo_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlCoolerInfo_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_GET_STATE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlWorkloadPowerProfileRequestedProfiles_v1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_CC_SYSTEM_CPU_CAPS_NONE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GRID_LICENSE_EXPIRY_NOT_APPLICABLE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VALUE_NOT_AVAILABLE_uint", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceSetVirtualizationMode", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PCIE_LINK_MAX_SPEED_8000MBPS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetVgpuProcessUtilization", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_FLIT_ERROR_COUNT_L0", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetFBCSessions", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.third_party.pynvml.nvmlVgpuRuntimeState_v1_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "nvmlVgpuRuntimeState_v1_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceIsMigDeviceHandle", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetPowerState", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L8_RX_PER_SEC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlVgpuPlacementList_v2_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlVgpuPlacementList_v2_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_ECC_DATA_ERROR_COUNT_L5", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_VIRTUALIZATION_MODE_HOST_VSGA", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_POWER_SMOOTHING_PROFILE_PARAM_RAMP_UP_RATE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_TOTAL_SUPPORTED_BW_MODES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetTotalEccErrors", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetHandleBySerial", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetVgpuTypeCreatablePlacements", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_THERMAL_COOLER_TARGET_POWER_SUPPLY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_INSTANCE_PROFILE_1_SLICE_REV2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_PERF_POLICY_THERMAL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlEventMigConfigChange", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_COMPUTE_INSTANCE_ENGINE_PROFILE_SHARED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuInstanceClearAccountingPids", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetAutoBoostedClocksEnabled", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_ADAPTIVE_CLOCKING_INFO_STATUS_DISABLED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_RECOVERY_ERROR_COUNT_L11", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetVgpuMetadata", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_VIRTUALIZATION_MODE_HOST_VGPU", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlGpuFabricInfo_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlGpuFabricInfo_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetPowerUsage", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetFanSpeed", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PAGE_RETIREMENT_CAUSE_DOUBLE_BIT_ECC_ERROR", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_DATA_ERROR_COUNT_L5", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DEVICE_VGPU_CAP_DEVICE_STREAMING", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlVgpuProcessUtilizationSample_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlVgpuProcessUtilizationSample_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetSupportedMemoryClocks", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_PERF_POLICY_SYNC_BOOST", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_SYMBOL_ERRORS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_RESTRICTED_API_SET_APPLICATION_CLOCKS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GRID_LICENSE_STATE_UNKNOWN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlClocksThrottleReasonNone", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DEVICE_GPU_FRU_PART_NUMBER_BUFFER_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlUnitGetUnitInfo", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlVgpuLicenseInfo_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlVgpuLicenseInfo_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_MEMORY_LOCATION_TEXTURE_SHM", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_NVLINK_BW_MODE_FULL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceSetMemClkVfOffset", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_FEC_HISTORY_15", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_INSTANCE_PROFILE_3_SLICE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VALUE_TYPE_UNSIGNED_SHORT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetPendingDramEncryptionMode", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetTemperature", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceSetDefaultFanSpeed_v2", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_INFOROM_COUNT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_POWER_STATE_HIGH_SPEED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DEVICE_VBIOS_VERSION_BUFFER_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_COMPUTE_INSTANCE_PROFILE_2_SLICE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVDEC_6_UTIL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetInforomVersion", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_DEVICE_TYPE_UNKNOWN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetPerformanceState", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DEVICE_ARCH_HOPPER", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GRID_LICENSE_FEATURE_CODE_COMPUTE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_FABRIC_UUID_LEN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlClocksThrottleReasonSwThermalSlowdown", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlNvLinkPowerThres_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlNvLinkPowerThres_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_THERMAL_CONTROLLER_G781", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlWorkloadPowerProfileProfilesInfo_v1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlUnitGetTemperature", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlShutdown", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_ECC_DBE_AGG_L2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_COUNTER_PKTFILTER_NOP", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PCIE_ATOMICS_CAP_CAS128", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlVgpuSchedulerSetState_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlVgpuSchedulerSetState_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetCurrPcieLinkGeneration", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetMPSComputeRunningProcesses", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetCapabilities", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_PERF_POLICY_TOTAL_APP_CLOCKS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_THERMAL_CONTROLLER_LM89", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_RETIRED_DBE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlFlagForce", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L12_RX_PER_SEC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_PWR_SMOOTHING_ADMIN_OVERRIDE_RAMP_DOWN_RATE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetNvLinkState", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_BUFFER_OVERRUN_ERRORS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_MEMORY_ERROR_TYPE_CORRECTED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VALUE_NOT_AVAILABLE_ulonglong", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetGpuInstancePossiblePlacements", "n_typed": 0, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GSP_FIRMWARE_VERSION_BUF_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_POWER_SCOPE_GPU", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_ECC_SBE_VOL_L1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PERF_POLICY_POWER", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_PCIE_COUNT_UNSUPPORTED_REQ", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_THERMAL_CONTROLLER_ADT7461", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlGpmSampleGet", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuInstanceGetEccMode", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.c_nvmlGpmSample_t", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_MEMORY_LOCATION_DEVICE_MEMORY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceSetDramEncryptionMode", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_THERMAL_TARGET_VCD_OUTLET", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetBAR1MemoryInfo", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetArchitecture", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_INTEGER_UTIL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_BRAND_NVIDIA_VPC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_FABRIC_HEALTH_MASK_ROUTE_UNHEALTHY_TRUE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceSetDefaultAutoBoostedClocksEnabled", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_ECC_SBE_AGG_L1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_INSTANCE_PROFILE_8_SLICE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceResetNvLinkErrorCounters", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetNvLinkUtilizationControl", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C1_L6", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlComputeInstanceInfo_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlComputeInstanceInfo_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DEVICE_GPU_PART_NUMBER_BUFFER_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetNvLinkUtilizationCounter", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_VERSION_3_1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlEventTypePState", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PERF_POLICY_THERMAL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_ECC_DBE_AGG_CBU", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_INSTANCE_PROFILE_7_SLICE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlEventTypeAll", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_MEMORY_LOCATION_REGISTER_FILE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetClock", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetMaxPcieLinkWidth", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_RCV_GENERAL_ERRORS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlUnitGetDevices", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceQueryDrainState", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_INSTANCE_PROFILE_4_SLICE_GFX", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VGPU_CAP_MULTI_VGPU_EXCLUSIVE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_ERROR_DRIVER_NOT_LOADED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VGPU_DRIVER_CAP_COUNT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_INFOROM_POWER", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlVgpuInstancesUtilizationInfo_v1_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlVgpuInstancesUtilizationInfo_v1_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetMultiGpuBoard", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlViolationTime_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlViolationTime_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C0_L11", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_PCIE_L0_TO_RECOVERY_COUNTER", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_COMPUTE_INSTANCE_ENGINE_PROFILE_COUNT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_ERROR_DL_REPLAY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_CAP_SYSMEM_ACCESS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_RECOVERY_ERROR_COUNT_L4", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceSetVgpuSchedulerState", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlPowerValue_v2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DEVICE_PART_NUMBER_BUFFER_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GRID_LICENSE_FEATURE_CODE_GAMING", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_CLOCK_GRAPHICS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceWorkloadPowerProfileSetRequestedProfiles", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetMigDeviceHandleByIndex", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetRemappedRows", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_ERROR_VGPU_ECC_NOT_SUPPORTED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVDEC_5_UTIL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetInforomImageVersion", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_FABRIC_HEALTH_MASK_WIDTH_ROUTE_RECOVERY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuInstanceGetUUID", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C1_TOTAL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GRID_LICENSE_BUFFER_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C1_L3", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_FEC_HISTORY_4", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PERF_POLICY_COUNT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_SPEED_MBPS_L6", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_PWR_SMOOTHING_PROFILE_RAMP_UP_RATE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetComputeRunningProcesses", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_PCIE_REPLAY_COUNTER", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_CLOCK_VIDEO", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlGpmQueryDeviceSupport", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_INSTANCE_PROFILE_1_SLICE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlGridLicensableFeatures_v3_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlGridLicensableFeatures_v3_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_SPEED_MBPS_L5", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlWorkloadPowerProfileCurrentProfiles_v1_t", "methods": [ { "kind": "function", "name": "c_nvmlWorkloadPowerProfileCurrentProfiles_v1_t.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlWorkloadPowerProfileCurrentProfiles_v1_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PCIE_LINK_KEEP", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_PCIE_COUNT_FATAL_ERROR", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlMask255_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlMask255_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_ERROR_DL_CRC_FLIT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L4_RX_PER_SEC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_ECC_DBE_AGG_REG", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVJPG_5_UTIL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetNvLinkCapability", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_INFOROM_ECC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetCoolerInfo", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlGpuThermalSensor_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlGpuThermalSensor_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlGpmSupport_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlGpmSupport_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_INSTANCE_PROFILE_2_SLICE_GFX", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_INSTANCE_PROFILE_COUNT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_DRAM_BW_UTIL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlUnitGetCount", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlFlagDefault", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDevicePowerSmoothingUpdatePresetProfileParam", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlNvlinkSupportedBwModes_v1_t", "methods": [ { "kind": "function", "name": "c_nvmlNvlinkSupportedBwModes_v1_t.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlNvlinkSupportedBwModes_v1_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlGpmMetricsGet", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_DATA_ERROR_COUNT_L1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVDEC_3_UTIL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PSTATE_12", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_PWR_SMOOTHING_MIN_PERCENT_TMP_FLOOR_SETTING", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PCIE_ATOMICS_CAP_SWAP32", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VGPU_SCHEDULER_ARR_DEFAULT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlProcessDetailList_v1_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlProcessDetailList_v1_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "c_nvmlProcessDetailList_v1_t._fmt_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VGPU_DRIVER_CAP_HETEROGENEOUS_MULTI_VGPU", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L3_RX_PER_SEC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_PERF_POLICY_POWER", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetMPSComputeRunningProcesses_v3", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_DEVICE_TYPE_IBMNPU", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_FLIT_ERROR_COUNT_L5", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlGpuInstanceProfileInfo_v2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_POWER_PROFILE_HPC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceWorkloadPowerProfileGetProfilesInfo", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceSetPersistenceMode", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C1_L5", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetRunningProcessDetailList", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuInstanceGetFBCStats", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_THERMAL_CONTROLLER_NONE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlUnitGetFanSpeedInfo", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlEventSetWait_v2", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_P2P_STATUS_OK", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C0_L4", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuInstanceGetVmDriverVersion", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlMemory_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlMemory_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "c_nvmlMemory_t._fmt_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_PCIE_COUNT_NON_FATAL_ERROR", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetTargetFanSpeed", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetGpuFabricInfo", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_EFFECTIVE_ERRORS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_THERMAL_CONTROLLER_UNKNOWN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlSystemGetCudaDriverVersion_v2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DEVICE_VGPU_CAP_MINI_QUARTER_GPU", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DEVICE_PCI_BUS_ID_FMT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_FABRIC_STATE_NOT_SUPPORTED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuTypeGetMaxInstancesPerVm", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_ECC_DBE_VOL_L2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_INSTANCE_PROFILE_1_SLICE_REV1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetAccountingMode", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlGpuInstancePlacement_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlGpuInstancePlacement_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlConfComputeSystemCaps_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlConfComputeSystemCaps_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_RCV_PACKETS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlSystemGetNVMLVersion", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceSetApplicationsClocks", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GOM_ALL_ON", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetNvLinkRemoteDeviceType", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlVgpuSchedulerParams_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlVgpuSchedulerParams_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetSupportedPerformanceStates", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_POWER_SOURCE_BATTERY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_POWER_SCOPE_MEMORY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetPcieThroughput", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlClocksEventReasonHwPowerBrakeSlowdown", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlGetVgpuVersion", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_CC_SYSTEM_CPU_CAPS_AMD_SNP_VTOM", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetDeviceHandleFromMigDeviceHandle", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceOnSameBoard", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_INIT_FLAG_NO_GPUS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_ERROR_OPERATING_SYSTEM", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlClocksEventReasonAll", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetSerial", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.ConfComputeSetKeyRotationThresholdInfo_v1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_FABRIC_HEALTH_MASK_DEGRADED_BW_NOT_SUPPORTED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetUUID", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_UTILIZATION_DOMAIN_GPU", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetFanSpeed_v2", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L0_RX_PER_SEC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_REMAPPED_PENDING", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlGetExcludedDeviceInfoByIndex", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_THERMAL_COOLER_TARGET_NONE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C1_L11", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetAccountingPids", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VGPU_SCHEDULER_POLICY_UNKNOWN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetClkMonStatus", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetVgpuUtilization", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetPlatformInfo", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_PWR_SMOOTHING_PROFILE_RAMP_DOWN_RATE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.libLoadLock", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DETACH_GPU_REMOVE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_DFMA_TENSOR_UTIL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_MAX_GPU_UTILIZATIONS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_ERROR_GPU_IS_LOST", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_SPEED_MBPS_L9", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_CC_SYSTEM_DEVTOOLS_MODE_ON", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlSystemDriverBranchInfo_v1_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlSystemDriverBranchInfo_v1_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlGridLicensableFeature_v2_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlGridLicensableFeature_v2_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlPowerValue_v2_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlPowerValue_v2_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "c_nvmlPowerValue_v2_t._fmt_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlDeviceAttributes", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlDeviceAttributes._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DEC_UTILIZATION_SAMPLES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_ERROR_DL_ECC_LANE2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_ANY_TENSOR_UTIL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DEVICE_UUID_V2_BUFFER_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.struct_c_nvmlGpmSample_t", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuInstanceGetFBCSessions", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_SPEED_MBPS_L2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlSystemSetNvlinkBwMode", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PCIE_ATOMICS_CAP_CAS64", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetPowerSource", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PSTATE_10", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_PCIE_REPLAY_ROLLOVER_COUNTER", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_CC_CEC_ATTESTATION_REPORT_PRESENT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlVgpuSchedDataWithARR_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlVgpuSchedDataWithARR_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlClocksEventReasonSwPowerCap", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L11_RX_PER_SEC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuTypeGetGpuInstanceProfileId", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_FP64_UTIL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C0_L2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_ECC_DBE_VOL_L1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VGPU_CAP_COUNT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceClearAccountingPids", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_ENCODER_QUERY_H264", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetGridLicensableFeatures_v4", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_ECC_DBE_VOL_TEX", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GRID_LICENSE_STATE_UNLICENSED_RESTRICTED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_THERMAL_CONTROLLER_LM64", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_MAX_LINKS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceSetGpuOperationMode", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_THERMAL_TARGET_BOARD", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetSupportedClocksThrottleReasons", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_FABRIC_HEALTH_MASK_WIDTH_DEGRADED_BW", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetMemClkMinMaxVfOffset", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_POWER_PROFILE_MIG", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_MEMORY_LOCATION_L2_CACHE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlSystemGetTopologyGpuSet", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlC2cModeInfo_v1_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlC2cModeInfo_v1_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlSystemGetCudaDriverVersion", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DEVICE_NAME_BUFFER_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlEventTypeGpuUnavailableError", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_PWR_SMOOTHING_ADMIN_OVERRIDE_RAMP_UP_RATE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_SPEED_MBPS_L11", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_INSTANCE_PROFILE_1_SLICE_GFX", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_FABRIC_HEALTH_MASK_WIDTH_ACCESS_TIMEOUT_RECOVERY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetAPIRestriction", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlTemperature_v1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L16_TX_PER_SEC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_PWR_SMOOTHING_ENABLED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_FABRIC_HEALTH_MASK_SHIFT_ACCESS_TIMEOUT_RECOVERY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_P2P_CAPS_INDEX_READ", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlVgpuPlacementId_v1_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlVgpuPlacementId_v1_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_SYSTEM_NVML_VERSION_BUFFER_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.struct_c_nvmlUnit_t", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C0_TOTAL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_REPLAY_ERROR_COUNT_L6", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVJPG_2_UTIL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceClearEccErrorCounts", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_RAW_BER_LANE0", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PERF_POLICY_BOARD_LIMIT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_BUS_TYPE_UNKNOWN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VGPU_CAP_NVLINK_P2P", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_ERROR_NOT_READY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_TEMPERATURE_THRESHOLD_SHUTDOWN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_FEC_HISTORY_8", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_PERF_POLICY_RELIABILITY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PSTATE_3", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlGpuDynamicPstatesUtilization_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlGpuDynamicPstatesUtilization_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C0_L6", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VALUE_TYPE_SIGNED_LONG_LONG", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetProcessUtilization", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_ERROR_NO_PERMISSION", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_P2P_STATUS_IOH_TOPOLOGY_NOT_SUPPORTED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlVgpuPgpuCompatibility_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlVgpuPgpuCompatibility_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_POWER_REQUESTED_LIMIT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_TOTAL_POWER_SAMPLES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlVgpuSchedulerCapabilities_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlVgpuSchedulerCapabilities_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlClocksThrottleReasonHwThermalSlowdown", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlSystemConfComputeSettings_v1_t", "methods": [ { "kind": "function", "name": "c_nvmlSystemConfComputeSettings_v1_t.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlSystemConfComputeSettings_v1_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuInstanceSetEncoderCapacity", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetCurrentDramEncryptionMode", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_BRAND_NVIDIA_VAPPS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.VgpuProcessesUtilizationInfo_v1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlGpmQueryIfStreamingEnabled", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVJPG_6_UTIL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_ECC_SBE_AGG_TEX", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlFieldValue_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlFieldValue_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VGPU_VM_COMPATIBILITY_LIVE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.VgpuPlacementList_v1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetSupportedClocksEventReasons", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_C2C_LINK_COUNT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetP2PStatus", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_HMMA_TENSOR_UTIL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_ECC_COUNTER_TYPE_COUNT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_ERROR_FUNCTION_NOT_FOUND", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VGPU_CAP_EXCLUSIVE_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetEnforcedPowerLimit", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_FABRIC_STATE_IN_PROGRESS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_COMPUTE_INSTANCE_PROFILE_7_SLICE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceValidateInforom", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlGpmSetStreamingEnabled", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_ECC_SBE_AGG_L2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_DATA_ERROR_COUNT_L11", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_ERROR_ARGUMENT_VERSION_MISMATCH", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_NVLINK_BW_MODE_OFF", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_TEMPERATURE_GPU", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlVgpuProcessesUtilizationInfo_v1_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlVgpuProcessesUtilizationInfo_v1_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VGPU_VM_COMPATIBILITY_SLEEP", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetGpcClkVfOffset", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_FLIT_ERROR_COUNT_L4", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_VIRTUALIZATION_MODE_NONE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlDevicePerfModes_v1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceRemoveGpu", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PCIE_LINK_SHUT_DOWN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_ERROR_CORRUPTED_INFOROM", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_MEMORY_LOCATION_CBU", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_CLOCK_ID_CURRENT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetRetiredPagesPendingStatus", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DRIVER_MCDM", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlSystemGetConfComputeSettings", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.convertStrBytes", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_ERROR_LIB_RM_VERSION_MISMATCH", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlComputeInstanceDestroy", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_ERROR_COUNT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_CAP_VALID", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_COMPUTEMODE_PROHIBITED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_THROUGHPUT_RAW_RX", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_CC_SYSTEM_DEVTOOLS_MODE_OFF", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L2_RX_PER_SEC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_SPEED_MBPS_L1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_COUNTER_UNIT_RESERVED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_DATA_ERROR_COUNT_L9", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVDEC_0_UTIL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetMemClkVfOffset", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_SPEED_MBPS_L7", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.struct_c_nvmlEventSet_t", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetViolationStatus", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_ECC_SBE_VOL_REG", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_LOW_POWER_THRESHOLD_RESET", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_BUS_TYPE_PCIE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetPendingGpuOperationMode", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuInstanceGetLicenseStatus", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlTemperature_v1_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlTemperature_v1_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_THERMAL_COOLER_SIGNAL_COUNT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.nvmlClkMonStatus_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "nvmlClkMonStatus_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_CAP_COUNT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_BRAND_GRID", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_RAW_BER", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDevicePowerSmoothingSetState", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PCIE_LINK_MAX_SPEED_16000MBPS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.ProcessesUtilizationInfo_v1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlFBCStats_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlFBCStats_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlGpuFabricInfo_v2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_INSTANCE_PROFILE_4_SLICE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_REPLAY_ERROR_COUNT_TOTAL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuInstanceGetLicenseInfo", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_DRAIN_AND_RESET_STATUS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuTypeGetCapabilities", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_FABRIC_HEALTH_MASK_ROUTE_UNHEALTHY_FALSE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_CAP_P2P_SUPPORTED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_FLIT_ERROR_COUNT_L11", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlPowerSmoothingState_v1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVDEC_1_UTIL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_RCV_BYTES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_ECC_DATA_ERROR_COUNT_TOTAL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlProcessesUtilizationInfo_v1_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlProcessesUtilizationInfo_v1_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_PCIE_COUNT_LCRC_ERROR", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceSetAutoBoostedClocksEnabled", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_SYMBOL_BER", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetBoardId", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_TEMPERATURE_MEM_MAX_TLIMIT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetPendingEccMode", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VGPU_COMPATIBILITY_LIMIT_GUEST_DRIVER", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlGpuInstanceGetComputeInstances", "n_typed": 0, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlPowerSmoothingState_v1_t", "methods": [ { "kind": "function", "name": "c_nvmlPowerSmoothingState_v1_t.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlPowerSmoothingState_v1_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_LOW_POWER_THRESHOLD_MIN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L16_RX_PER_SEC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_DATA_ERROR_COUNT_L3", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetGpuInstanceById", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_BRAND_NVS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DETACH_GPU_KEEP", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_TOPOLOGY_INTERNAL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_RETIRED_SBE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlSystemGetNvlinkBwMode", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VGPU_PGPU_HETEROGENEOUS_MODE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlDeviceCapabilities_v1_t", "methods": [ { "kind": "function", "name": "c_nvmlDeviceCapabilities_v1_t.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlDeviceCapabilities_v1_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_ECC_SBE_VOL_TOTAL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C0_L1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PROCESS_MODE_MPS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_CC_KEY_ROTATION_THRESH_ATTACKER_ADVANTAGE_MIN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_BRAND_NVIDIA", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetCreatableVgpus", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_FLIT_ERROR_COUNT_L7", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_THERMAL_CONTROLLER_LM99", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_CC_GPU_CEC_NONCE_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetMPSComputeRunningProcesses_v2", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetVgpuTypeSupportedPlacements", "n_typed": 0, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlSystemGetHicVersion", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_SUPPORTED_VGPU_SCHEDULER_POLICY_COUNT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.VgpuHeterogeneousMode_v1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VGPU_DRIVER_CAP_WARM_UPDATE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_FABRIC_HEALTH_MASK_WIDTH_ROUTE_UNHEALTHY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlEventData_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlEventData_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "c_nvmlEventData_t._fmt_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L10_RX_PER_SEC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DRIVER_WDDM", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlBridgeChipHierarchy_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlBridgeChipHierarchy_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_BRAND_QUADRO", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_COUNTER_UNIT_BYTES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_GET_POWER_THRESHOLD_SUPPORTED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_EFFECTIVE_BER", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_REPLAY_ERROR_COUNT_L11", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VGPU_SCHEDULER_ARR_DISABLE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_POWER_PROFILE_MAX_P", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_POWER_INSTANT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetMemoryErrorCounter", "n_typed": 0, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_HOST_VGPU_MODE_NON_SRIOV", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuInstanceGetVmID", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlClocksThrottleReasonHwSlowdown", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L7_RX_PER_SEC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C0_L8", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlMarginTemperature_v1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L13_TX_PER_SEC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetComputeInstanceId", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_POWER_PROFILE_LLM_TRAINING", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_SPEED_MBPS_L3", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VGPU_VM_ID_DOMAIN_ID", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_REPLAY_ERROR_COUNT_L9", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_UTILIZATION_SAMPLES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PCIE_LINK_MAX_SPEED_2500MBPS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L1_RX_PER_SEC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PERF_POLICY_SYNC_BOOST", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_BUS_TYPE_PCI", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlVgpuSchedulerLogEntry_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlVgpuSchedulerLogEntry_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetClockInfo", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlEventTypeSingleBitEccError", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_BUS_TYPE_AGP", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlWorkloadPowerProfileInfo_v1_t", "methods": [ { "kind": "function", "name": "c_nvmlWorkloadPowerProfileInfo_v1_t.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlWorkloadPowerProfileInfo_v1_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceSetAPIRestriction", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_P2P_CAPS_INDEX_PROP", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlSystemGetConfComputeCapabilities", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlVgpuSchedSetData_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlVgpuSchedSetData_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetInforomConfigurationChecksum", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetGpcClkMinMaxVfOffset", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_TOTAL_ENERGY_CONSUMPTION", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_STATE_SLEEP", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_TEMPERATURE_THRESHOLD_ACOUSTIC_MIN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceClearCpuAffinity", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VALUE_TYPE_COUNT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetCurrPcieLinkWidth", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_RETIRED_PENDING_DBE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceSetMemoryLockedClocks", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuInstanceGetMetadata", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_THERMAL_CONTROLLER_ADT7473S", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetFieldValues", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlWorkloadPowerProfileInfo_v1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceSetMigMode", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FBC_SESSION_TYPE_HWENC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuTypeGetLicense", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_FEC_HISTORY_12", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetPowerManagementMode", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_REMOTE_NVLINK_ID", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlEventSetWait", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_ECC_DBE_VOL_REG", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuTypeGetMaxInstances", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetPgpuMetadataString", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceSetEccMode", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_JPG_UTILIZATION_SAMPLES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVJPG_7_UTIL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceSetGpcClkVfOffset", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_CC_SYSTEM_MULTIGPU_NONE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_CLOCK_MEM", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceRegisterEvents", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlComputeInstanceProfileInfo_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlComputeInstanceProfileInfo_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetFanControlPolicy_v2", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuInstanceGetEncoderSessions", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlSystemGetConfComputeGpusReadyState", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_GET_SPEED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_LINK_RECOVERY_EVENTS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_BRAND_TITAN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetProcessesUtilizationInfo", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_TOTAL_RX_PER_SEC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L15_RX_PER_SEC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_BRAND_UNKNOWN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetMemoryAffinity", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_PCIE_OUTBOUND_ATOMICS_MASK", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_RETIRED_PENDING_SBE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetPciInfo_v3", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuTypeGetFbReservation", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceCreateGpuInstanceWithPlacement", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VGPU_SCHEDULER_ARR_ENABLE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GRID_LICENSE_FEATURE_CODE_VGPU", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlGridLicensableFeature_v3_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlGridLicensableFeature_v3_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VGPU_VM_ID_UUID", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_FEC_HISTORY_3", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_ECC_DBE_VOL_CBU", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_PWR_SMOOTHING_IMM_RAMP_DOWN_ENABLED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_COMPUTE_INSTANCE_PROFILE_COUNT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_RESTRICTED_API_COUNT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRICS_GET_VERSION", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_BRAND_GEFORCE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DEVICE_ARCH_KEPLER", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C1_L7", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetConfComputeGpuCertificate", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDevicePowerSmoothingActivatePresetProfile", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_MEMORY_LOCATION_TEXTURE_MEMORY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetDynamicPstatesInfo", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetNumFans", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_ERROR_RESET_REQUIRED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_ECC_DATA_ERROR_COUNT_L7", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L6_TX_PER_SEC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_ECC_DATA_ERROR_COUNT_L11", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_LINK_COUNT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_SPEED_MBPS_L10", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DOUBLE_BIT_ECC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_CC_SYSTEM_CPU_CAPS_INTEL_TDX", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DEVICE_ARCH_BLACKWELL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_FABRIC_HEALTH_MASK_ROUTE_UNHEALTHY_NOT_SUPPORTED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_CAP_P2P_ATOMICS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetDetailedEccErrors", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_ENCODER_QUERY_HEVC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_P2P_CAPS_INDEX_NVLINK", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_ERROR_DL_ECC_DATA", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetVgpuSchedulerCapabilities", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlGpuFabricInfoV_t", "methods": [ { "kind": "function", "name": "c_nvmlGpuFabricInfoV_t.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlGpuFabricInfoV_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L5_RX_PER_SEC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_GET_POWER_THRESHOLD_UNITS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_CC_SYSTEM_ENVIRONMENT_PROD", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_CLOCK_COUNT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_ECC_ERROR_TYPE_COUNT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_IMMA_TENSOR_UTIL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlUnitGetDeviceCount", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DEVICE_ARCH_ADA", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlEventSetFree", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_CAP_SYSMEM_ATOMICS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuTypeGetFramebufferSize", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_RESET_STATUS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VGPU_VM_COMPATIBILITY_NONE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlUnitGetHandleByIndex", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_PERF_POLICY_LOW_UTILIZATION", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlGpuInstanceDestroy", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlDeviceCurrentClockFreqs_v1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_TEMPERATURE_SLOWDOWN_TLIMIT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_RECOVERY_ACTION_NODE_REBOOT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FEATURE_DISABLED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FBC_SESSION_TYPE_UNKNOWN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_PWR_SMOOTHING_ADMIN_OVERRIDE_PERCENT_TMP_FLOOR", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_ERROR_LIBRARY_NOT_FOUND", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_RECOVERY_ERROR_COUNT_L0", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_STATE_ACTIVE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FAN_FAILED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_ECC_DATA_ERROR_COUNT_L0", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_PCIE_COUNT_RECEIVER_ERROR", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetVgpuHeterogeneousMode", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceSetVgpuHeterogeneousMode", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlUnitInfo_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlUnitInfo_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlGridLicenseExpiry_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlGridLicenseExpiry_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_ERROR_DL_ECC_COUNT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlValue_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlValue_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VALUE_TYPE_UNSIGNED_LONG", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_DATA_ERROR_COUNT_L4", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetMinMaxFanSpeed", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetGpuMaxPcieLinkGeneration", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetDecoderUtilization", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_ECC_SBE_AGG_DEV", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.nvmlFriendlyObject", "methods": [ { "kind": "function", "name": "nvmlFriendlyObject.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "nvmlFriendlyObject.__str__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetTemperatureThreshold", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_DATA_ERROR_COUNT_L10", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_VERSION_2_0", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetRetiredPages_v2", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DEVICE_VGPU_CAP_WRITE_DEVICE_BUFFER_BW", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_RECOVERY_ERROR_COUNT_L6", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlNvlinkSetBwMode_v1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlRowRemapperHistogramValues", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlRowRemapperHistogramValues._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlPlatformInfo_v1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L12_TX_PER_SEC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceDiscoverGpus", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_FABRIC_HEALTH_MASK_ROUTE_RECOVERY_NOT_SUPPORTED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_MEMORY_UTILIZATION_SAMPLES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_THERMAL_TARGET_VCD_BOARD", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlUnitGetLedState", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlLib", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVSWITCH_CONNECTED_LINK_COUNT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_CERT_CHAIN_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_POWER_SMOOTHING_PROFILE_PARAM_RAMP_DOWN_RATE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetCudaComputeCapability", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.VgpuTypeBar1Info_v1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetMemoryBusWidth", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_PWR_SMOOTHING_ADMIN_OVERRIDE_RAMP_DOWN_HYST_VAL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_THERMAL_CONTROLLER_NVSYSCON_CANOAS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_MAX_GPC_COUNT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuInstanceGetAccountingPids", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_HOST_VGPU_MODE_SRIOV", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_VERSION_4_0", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuInstanceGetAccountingMode", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlMarginTemperature_v1_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlMarginTemperature_v1_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_COMPUTE_INSTANCE_PROFILE_3_SLICE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetVbiosVersion", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_POWER_SOURCE_AC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlConfComputeGpuCertificate_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlConfComputeGpuCertificate_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_FEC_HISTORY_0", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_THERMAL_COOLER_SIGNAL_VARIABLE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C1_L10", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_PWR_SMOOTHING_ACTIVE_PRESET_PROFILE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetGpuInstanceRemainingCapacity", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_BUS_TYPE_FPCI", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L11_TX_PER_SEC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetEccMode", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_TEMPERATURE_THRESHOLD_COUNT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlSystemConfComputeSettings_v1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DEVICE_ARCH_TURING", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PCIE_ATOMICS_CAP_CAS32", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_DATA_ERROR_COUNT_L8", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_BRIDGE_CHIP_BRO4", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_OFA_UTILIZATION_SAMPLES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_TEMPERATURE_THRESHOLD_GPS_CURR", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_FEC_HISTORY_11", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_VERSION_5_0", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_FEC_HISTORY_2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_POWER_PROFILE_DCPCIE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VGPU_INSTANCE_GUEST_INFO_STATE_UNINITIALIZED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_CC_GPU_ATTESTATION_REPORT_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_GET_VERSION", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DEVICE_ARCH_VOLTA", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PROCESS_MODE_COMPUTE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_ERROR_INSUFFICIENT_RESOURCES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GRID_LICENSE_FEATURE_CODE_NVIDIA_RTX", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlGetVgpuCompatibility", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VGPU_SCHEDULER_POLICY_EQUAL_SHARE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuInstanceGetEncoderCapacity", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlClocksThrottleReasonSwPowerCap", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetBrand", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.MAX_CLK_DOMAINS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_MEMORY_ERROR_TYPE_UNCORRECTED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_INSTANCE_PROFILE_2_SLICE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_ECC_DATA_ERROR_COUNT_L8", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlSystemSetConfComputeGpusReadyState", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.third_party.pynvml.struct_c_nvmlGpuInstance_t", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetHandleByUUID", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetAdaptiveClockInfoStatus", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VGPU_PGPU_HOMOGENEOUS_MODE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_POWER_SCOPE_MODULE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetName", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlUtilization_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlUtilization_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "c_nvmlUtilization_t._fmt_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlEccErrorCounts_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlEccErrorCounts_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FAN_POLICY_MANUAL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_CC_ACCEPTING_CLIENT_REQUESTS_TRUE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_ECC_DBE_AGG_TOTAL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_REPLAY_ERROR_COUNT_L1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VGPU_METADATA_OPAQUE_DATA_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L2_TX_PER_SEC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_CC_CEC_ATTESTATION_REPORT_NOT_PRESENT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlVgpuSchedData_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlVgpuSchedData_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetCurrentEccMode", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PERF_POLICY_TOTAL_BASE_CLOCKS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C0_L7", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetVgpuSchedulerLog", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PCIE_LINK_MAX_SPEED_64000MBPS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_CC_SYSTEM_ENVIRONMENT_UNAVAILABLE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_PCIE_COUNT_NAKS_SENT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_COUNTER_PKTFILTER_WRITE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_SINGLE_BIT_ECC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetPowerManagementDefaultLimit", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlClocksEventReasonHwSlowdown", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_DATA_ERROR_COUNT_L6", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L14_TX_PER_SEC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetMemoryInfo", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceSetNvLinkDeviceLowPowerThreshold", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GRID_LICENSE_FEATURE_MAX_COUNT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_THERMAL_TARGET_MEMORY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetConfComputeProtectedMemoryUsage", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_ENERGY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_ECC_DBE_VOL_TOTAL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_NVLINK_BW_MODE_COUNT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlFanSpeedInfo_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlFanSpeedInfo_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C0_L5", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlConfComputeGetKeyRotationThresholdInfo_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlConfComputeGetKeyRotationThresholdInfo_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_VL15_DROPPED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetGraphicsRunningProcesses_v2", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetOfaUtilization", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_P2P_STATUS_NOT_SUPPORTED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuInstanceGetGpuInstanceId", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_REPLAY_ERROR_COUNT_L8", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVDEC_4_UTIL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuInstanceGetType", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlUnitSetLedState", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlDeviceCapabilities_v1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_RETIRED_PENDING", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlErrorString", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlGridLicensableFeatures_v4_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlGridLicensableFeatures_v4_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_POWER_PROFILE_SYNC_BALANCED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VGPU_COMPATIBILITY_LIMIT_OTHER", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_BRAND_QUADRO_RTX", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_SYSTEM_DRIVER_VERSION_BUFFER_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_RECOVERY_ACTION_GPU_RESET", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetGspFirmwareVersion", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetVgpuProcessesUtilizationInfo", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PSTATE_1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlConfComputeMemSizeInfo_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlConfComputeMemSizeInfo_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetFBCStats", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_BRAND_NVIDIA_VWS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlGetExcludedDeviceCount", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_RCV_REMOTE_ERRORS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DEVICE_VGPU_CAP_READ_DEVICE_BUFFER_BW", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_ATTESTATION_CERT_CHAIN_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_RECOVERY_ERROR_COUNT_TOTAL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_ECC_DBE_AGG_DEV", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_RECOVERY_ERROR_COUNT_L2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_FABRIC_HEALTH_MASK_ROUTE_RECOVERY_TRUE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_THROUGHPUT_DATA_RX", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlClocksThrottleReasonAll", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceCreateGpuInstance", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_DEVICE_TYPE_SWITCH", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_RECOVERY_ERROR_COUNT_L10", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetDriverModel", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_POWER_MAX_LIMIT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlClocksEventReasonGpuIdle", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlConfComputeSetKeyRotationThresholdInfo_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlConfComputeSetKeyRotationThresholdInfo_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_COMPUTEMODE_COUNT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_FABRIC_HEALTH_MASK_ACCESS_TIMEOUT_RECOVERY_FALSE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_ECC_DATA_ERROR_COUNT_L6", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.VgpuInstancesUtilizationInfo_v1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceResetGpuLockedClocks", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlVgpuInstanceUtilizationInfo_v1_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlVgpuInstanceUtilizationInfo_v1_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceResetMemoryLockedClocks", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlDeviceCurrentClockFreqs_v1_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlDeviceCurrentClockFreqs_v1_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_ECC_DATA_ERROR_COUNT_L4", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DEVICE_VGPU_CAP_COUNT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceResetApplicationsClocks", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_COMPUTE_INSTANCE_PROFILE_1_SLICE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VGPU_PGPU_METADATA_OPAQUE_DATA_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlEventTypeSingleBitEccErrorStorm", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetActiveVgpus", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_ERROR_GPU_NOT_FOUND", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_DATA_ERROR_COUNT_TOTAL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_CC_SYSTEM_CPU_CAPS_AMD_SEV", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_ENCODER_QUERY_UNKNOWN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetDefaultEccMode", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlClockOffset_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlClockOffset_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_POWER_PROFILE_COMPUTE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlConfComputeSystemState_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlConfComputeSystemState_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetPcieLinkMaxSpeed", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_SAMPLINGTYPE_COUNT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_POWER_PROFILE_HMMA_DENSE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PROCESS_MODE_GRAPHICS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_THERMAL_TARGET_NONE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_DATA_ERROR_COUNT_L7", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_ERROR_DL_RECOVERY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlClocksEventReasonSyncBoost", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetTopologyCommonAncestor", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L8_TX_PER_SEC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetPowerManagementLimitConstraints", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuInstanceGetGpuPciId", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetMinMaxClockOfPState", "n_typed": 0, "n_any": 0, "n_untyped": 6, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_XMIT_DISCARDS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetGraphicsRunningProcesses_v3", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_PWR_SMOOTHING_APPLIED_TMP_CEIL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_COUNTER_PKTFILTER_RESPNODATA", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlPSUInfo_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlPSUInfo_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlEventTypeGpuRecoveryAction", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlAccountingStats_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlAccountingStats_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceModifyDrainState", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_REPLAY_ERROR_COUNT_L2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_CC_SYSTEM_ENVIRONMENT_SIM", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetDefaultApplicationsClock", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_FLIT_ERROR_COUNT_L1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_SPEED_MBPS_L4", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_THERMAL_CONTROLLER_GPU_INTERNAL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.c_nvmlGpuInstance_t", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlVgpuVersion_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlVgpuVersion_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_GET_POWER_THRESHOLD", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_THERMAL_COOLER_TARGET_GPU_RELATED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_COMPUTEMODE_EXCLUSIVE_PROCESS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_STATE_INACTIVE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L13_RX_PER_SEC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C1_L4", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PSTATE_7", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GRID_LICENSE_EXPIRY_INVALID", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_TOPOLOGY_SYSTEM", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.c_nvmlEventSet_t", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_COMPUTEMODE_EXCLUSIVE_THREAD", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_REPLAY_ERROR_COUNT_L10", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlVgpuLicenseExpiry_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlVgpuLicenseExpiry_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlGridLicensableFeature_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlGridLicensableFeature_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetConfComputeGpuAttestationReport", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_THERMAL_TARGET_UNKNOWN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetSupportedGraphicsClocks", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DEVICE_UUID_BUFFER_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_THERMAL_CONTROLLER_ADM1032", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C1_L2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.nvmlClkMonFaultInfo_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "nvmlClkMonFaultInfo_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetMinorNumber", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlSystemGetConfComputeState", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlUnitFanInfo_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlUnitFanInfo_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DEV_CAP_EGM", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetPciInfoExt", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_BRAND_TITAN_RTX", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VGPU_COMPATIBILITY_LIMIT_GPU", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_DEVICE_TYPE_GPU", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DEVICE_SERIAL_BUFFER_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_PCIE_COUNT_TX_BYTES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlClocksThrottleReasonSyncBoost", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DEVICE_ARCH_MAXWELL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_VIRTUALIZATION_MODE_PASSTHROUGH", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceSetComputeMode", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_CC_KEY_ROTATION_THRESH_ATTACKER_ADVANTAGE_MAX", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.nvmlPciInfo_v2_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "nvmlPciInfo_v2_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "nvmlPciInfo_v2_t._fmt_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlHwbcEntry_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlHwbcEntry_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L7_TX_PER_SEC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_PCIE_COUNT_CORRECTABLE_ERRORS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.nvmlPciInfo_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "nvmlPciInfo_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "nvmlPciInfo_t._fmt_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetNvLinkVersion", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_MEMORY_ERROR_TYPE_COUNT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceSetDriverModel", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetGraphicsRunningProcesses", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C1_L0", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_PCIE_COUNT_LANE_ERROR", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetC2cModeInfoV", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PSTATE_9", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_ECC_DBE_AGG_TEX", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_UTILIZATION_DOMAIN_VID", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_FLIT_ERROR_COUNT_L6", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlGpuThermalSettings_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlGpuThermalSettings_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_GET_POWER_STATE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PCIE_UTIL_RX_BYTES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.ConfComputeGetKeyRotationThresholdInfo_v1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_BRIDGE_CHIP_PLX", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_ENC_UTILIZATION_SAMPLES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlMemory_v2_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlMemory_v2_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "c_nvmlMemory_v2_t._fmt_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L17_RX_PER_SEC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_TOPOLOGY_NODE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.throwOnVersionMismatch", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetIrqNum", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_THERMAL_CONTROLLER_VBIOSEVT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_PWR_SMOOTHING_MAX_PERCENT_TMP_FLOOR_SETTING", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_NVLINK_BW_MODE_HALF", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_PERF_POLICY_TOTAL_BASE_CLOCKS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuTypeGetDeviceID", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_UTILIZATION_DOMAIN_BUS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_CLOCK_ID_COUNT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_COUNTER_PKTFILTER_READ", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PSTATE_6", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_ERROR_DL_ECC_LANE1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_XMIT_BYTES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_BRAND_NVIDIA_CLOUD_GAMING", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.nvmlPciInfoExt_v1_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "nvmlPciInfoExt_v1_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "nvmlPciInfoExt_v1_t._fmt_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_FABRIC_HEALTH_MASK_DEGRADED_BW_TRUE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceSetClockOffsets", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C0_L10", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlCoolerInfo_v1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceSetPowerManagementLimit", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_POWER_PROFILE_RBM", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlComputeInstanceProfileInfo_v2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetRetiredPages", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetTopologyNearestGpus", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetGridLicensableFeatures", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PSTATE_0", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PSTATE_4", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PCIE_UTIL_COUNT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetMaxPcieLinkGeneration", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_UTILIZATION_DOMAIN_FB", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetCurrentDriverModel", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceSetNvLinkUtilizationControl", "n_typed": 0, "n_any": 0, "n_untyped": 6, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlVgpuInstanceUtilizationSample_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlVgpuInstanceUtilizationSample_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetJpgUtilization", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_ERROR_ALREADY_INITIALIZED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_ERROR_TIMEOUT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlGpuInstanceCreateComputeInstance", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuTypeGetNumDisplayHeads", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PCIE_ATOMICS_OPS_MAX", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlProcessDetailList_v1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_CC_SYSTEM_CPU_CAPS_AMD_SEV_SNP", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_POWER_PROFILE_MAX", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_ERROR_NO_DATA", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlNvlinkSetBwMode_v1_t", "methods": [ { "kind": "function", "name": "c_nvmlNvlinkSetBwMode_v1_t.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlNvlinkSetBwMode_v1_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_MAX_THERMAL_SENSORS_PER_GPU", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_TEMPERATURE_THRESHOLD_MEM_MAX", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DEVICE_VGPU_CAP_HOMOGENEOUS_PLACEMENTS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_TEMPERATURE_SHUTDOWN_TLIMIT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_THERMAL_COOLER_SIGNAL_NONE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlSystemSetConfComputeKeyRotationThresholdInfo", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_ERROR_DL_RECOVERY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuTypeGetFrameRateLimit", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L9_TX_PER_SEC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlGpmMetric_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlGpmMetric_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_FEC_HISTORY_1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetHostVgpuMode", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_P2P_CAPS_INDEX_PCI", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetPerformanceModes", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetSamples", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_ECC_SBE_VOL_DEV", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlSetVgpuVersion", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L10_TX_PER_SEC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlComputeInstanceProfileInfo_v2_t", "methods": [ { "kind": "function", "name": "c_nvmlComputeInstanceProfileInfo_v2_t.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlComputeInstanceProfileInfo_v2_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceSetFanSpeed_v2", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_THROUGHPUT_RAW_TX", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GRID_LICENSE_STATE_UNINITIALIZED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DRIVER_WDM", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_REMAPPED_UNC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_POWER_AVERAGE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlBridgeChipInfo_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlBridgeChipInfo_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlEventTypeNonFatalPoisonError", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_THERMAL_CONTROLLER_MAX1617", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_THERMAL_COOLER_SIGNAL_TOGGLE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetPcieReplayCounter", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PCIE_UTIL_TX_BYTES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetPciInfo", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.c_nvmlUnit_t", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_RECOVERY_ACTION_NONE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DEVICE_MIG_ENABLE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlGpmMetricsGet_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlGpmMetricsGet_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetAttributes", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GRID_LICENSE_STATE_UNLICENSED_UNRESTRICTED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_BRAND_GEFORCE_RTX", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PCIE_LINK_MAX_SPEED_INVALID", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_ECC_DATA_ERROR_COUNT_L10", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlGridLicensableFeature_v4_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlGridLicensableFeature_v4_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVOFA_0_UTIL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetPersistenceMode", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_CC_GPU_CEC_ATTESTATION_REPORT_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlPciInfoExt_v1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.c_nvmlDevice_t", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuTypeGetName", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PERF_POLICY_RELIABILITY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_XMIT_PACKETS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetAccountingBufferSize", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlGpuInstanceGetInfo", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PERF_POLICY_LOW_UTILIZATION", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlGpmSampleFree", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_COMPUTE_INSTANCE_PROFILE_8_SLICE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlVgpuSchedulerLog_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlVgpuSchedulerLog_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_REPLAY_ERROR_COUNT_L0", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_ECC_SBE_AGG_TOTAL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlEventTypeXidCriticalError", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetAccountingStats", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetMaxMigDeviceCount", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L9_RX_PER_SEC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_AFFINITY_SCOPE_NODE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_PCIE_INBOUND_ATOMICS_MASK", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_ERROR_FREQ_NOT_SUPPORTED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetMigMode", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetMaxClockInfo", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_PCIE_COUNT_NAKS_RECEIVED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_INFOROM_DEN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GOM_LOW_DP", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_REMAPPED_FAILURE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_FEC_HISTORY_9", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_POWER_PROFILE_MEMORY_BOUND", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PSTATE_2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_LED_COLOR_AMBER", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_P2P_STATUS_GPU_NOT_SUPPORTED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_FLIT_ERROR_COUNT_L8", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuTypeGetGspHeapSize", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlProcessUtilizationSample_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlProcessUtilizationSample_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L14_RX_PER_SEC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlExcludedDeviceInfo_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlExcludedDeviceInfo_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_FEC_HISTORY_13", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_P2P_CAPS_INDEX_WRITE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GRID_LICENSE_FEATURE_CODE_UNKNOWN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PCIE_LINK_MAX_SPEED_32000MBPS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_RECOVERY_ERROR_COUNT_L9", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C0_L3", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlGpmSampleAlloc", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_ERROR_UNKNOWN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlEventTypeClock", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlWorkloadPowerProfileRequestedProfiles_v1_t", "methods": [ { "kind": "function", "name": "c_nvmlWorkloadPowerProfileRequestedProfiles_v1_t.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlWorkloadPowerProfileRequestedProfiles_v1_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetDisplayActive", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_TOTAL_TX_PER_SEC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetNvlinkSupportedBwModes", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_SUCCESS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_FABRIC_HEALTH_MASK_ROUTE_RECOVERY_FALSE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetRowRemapperHistogram", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetComputeMode", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlClocksEventReasonDisplayClockSetting", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetNvlinkBwMode", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetApplicationsClock", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_ERROR_DL_CRC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_FP32_UTIL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VALUE_TYPE_UNSIGNED_INT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VALUE_TYPE_SIGNED_INT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_THERMAL_CONTROLLER_MAX6649R", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlVgpuProcessUtilizationInfo_v1_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlVgpuProcessUtilizationInfo_v1_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_ERROR_DL_REPLAY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_MEMORY_LOCATION_DRAM", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlClocksEventReasonApplicationsClocksSetting", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_ERROR_NOT_FOUND", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlPowerSmoothingProfile_v1_t", "methods": [ { "kind": "function", "name": "c_nvmlPowerSmoothingProfile_v1_t.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlPowerSmoothingProfile_v1_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetBoardPartNumber", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_RECOVERY_ACTION_DRAIN_P2P", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_COMPUTE_INSTANCE_PROFILE_1_SLICE_REV1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_CC_SYSTEM_FEATURE_DISABLED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_MEMORY_LOCATION_SRAM", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_ECC_DATA_ERROR_COUNT_L2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_DATA_ERROR_COUNT_L0", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_WORKLOAD_POWER_MAX_PROFILES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_P2P_CAPS_INDEX_ATOMICS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlEncoderSession_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlEncoderSession_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_FABRIC_HEALTH_MASK_ACCESS_TIMEOUT_RECOVERY_NOT_SUPPORTED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_CLOCK_LIMIT_ID_UNLIMITED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GRID_LICENSE_EXPIRY_VALID", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_POWER_PROFILE_NETWORK", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PCIE_ATOMICS_CAP_FETCHADD64", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlWorkloadPowerProfileCurrentProfiles_v1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetNvLinkRemotePciInfo", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlUnitFanSpeeds_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlUnitFanSpeeds_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_TOPOLOGY_HOSTBRIDGE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_REPLAY_ERROR_COUNT_L5", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlVgpuTypeBar1Info_v1_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlVgpuTypeBar1Info_v1_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FBC_SESSION_TYPE_TOSYS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C0_L0", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_COMPUTE_INSTANCE_PROFILE_6_SLICE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlPlatformInfo_v1_t", "methods": [ { "kind": "function", "name": "c_nvmlPlatformInfo_v1_t.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlPlatformInfo_v1_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_ERROR_IN_USE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PCIE_ATOMICS_CAP_FETCHADD32", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlSystemGetProcessName", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_P2P_STATUS_CHIPSET_NOT_SUPPORED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVJPG_4_UTIL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_COUNTER_UNIT_PACKETS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_CLOCK_LIMIT_ID_RANGE_START", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlClocksThrottleReasonGpuIdle", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_FEC_HISTORY_14", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_LOW_POWER_THRESHOLD_MAX", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.nvmlNvLinkUtilizationControl_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "nvmlNvLinkUtilizationControl_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_ERROR_DL_CRC_DATA", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_THERMAL_CONTROLLER_NVSYSCON_E551", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_COUNTER_PKTFILTER_RATOM", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlSystemGetDriverVersion", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_LOW_POWER_THRESHOLD_UNIT_50US", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_RECOVERY_ERROR_COUNT_L3", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_MEMORY_CLK_SAMPLES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L17_TX_PER_SEC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_RESTRICTED_API_SET_AUTO_BOOSTED_CLOCKS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVDEC_2_UTIL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_PCIE_COUNT_BAD_TLP", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_THERMAL_COOLER_TARGET_GPU", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_PWR_SMOOTHING_MAX_NUM_PRESET_PROFILES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_CLOCK_SM", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_PWR_SMOOTHING_PROFILE_PERCENT_TMP_FLOOR", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetDisplayMode", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlNvlinkGetBwMode_v1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DEVICE_VGPU_CAP_HETEROGENEOUS_TIMESLICE_SIZES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_PCIE_RX_PER_SEC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetFanSpeedRPM", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlDramEncryptionInfo_v1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_MAX", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_ERROR_INSUFFICIENT_POWER", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceFreezeNvLinkUtilizationCounter", "n_typed": 0, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlVgpuPgpuMetadata_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlVgpuPgpuMetadata_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_MAX_GPU_PERF_PSTATES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_C2C_LINK_GET_STATUS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FBC_SESSION_TYPE_CUDA", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetGpuInstanceId", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_THERMAL_TARGET_VCD_INLET", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.struct_c_nvmlDevice_t", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DEVICE_ARCH_T23X", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlProcessInfo_v2_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlProcessInfo_v2_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "c_nvmlProcessInfo_v2_t._fmt_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_C2C_LINK_GET_MAX_BW", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_P2P_CAPS_INDEX_UNKNOWN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_RECOVERY_ERROR_COUNT_L5", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_THERMAL_TARGET_GPU", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_INSTANCE_PROFILE_6_SLICE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_CLOCK_ID_APP_CLOCK_TARGET", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.c_nvmlComputeInstance_t", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlEventTypeDramRetirementFailure", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_TEMPERATURE_COUNT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlFriendlyObjectToStruct", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_PERF_POLICY_BOARD_LIMIT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_POWER_PROFILE_HMMA_SPARSE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_FEC_HISTORY_7", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetEncoderStats", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_ERROR_IRQ_ISSUE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_BRAND_NVIDIA_VCS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GOM_COMPUTE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_NVLINK_BW_MODE_3QUARTER", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_CC_SYSTEM_GPUS_CC_NOT_CAPABLE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_P2P_STATUS_UNKNOWN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceSetPowerManagementLimit_v2", "n_typed": 0, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_POWER_SMOOTHING_MAX_NUM_PROFILES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_ERROR_INSUFFICIENT_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlGpuInstanceGetComputeInstanceRemainingCapacity", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VOLATILE_ECC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_GRAPHICS_UTIL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_ECC_DBE_VOL_DEV", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetMaxCustomerBoostClock", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlFBCSession_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlFBCSession_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L4_TX_PER_SEC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GRID_LICENSE_EXPIRY_NOT_AVAILABLE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlNvlinkGetBwMode_v1_t", "methods": [ { "kind": "function", "name": "c_nvmlNvlinkGetBwMode_v1_t.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlNvlinkGetBwMode_v1_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceSetFanControlPolicy", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_THROUGHPUT_DATA_TX", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_POWER_SOURCE_UNDERSIZED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetCpuAffinityWithinScope", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlSample_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlSample_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VGPU_CAP_GPUDIRECT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetNvLinkErrorCounter", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuInstanceGetFrameRateLimit", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_POWER_SMOOTHING_ADMIN_OVERRIDE_NOT_SET", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlEventSetCreate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceSetTemperatureThreshold", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceClearFieldValues", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DEVICE_VGPU_CAP_HETEROGENEOUS_TIMESLICE_PROFILES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DEVICE_ARCH_AMPERE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_ERROR_DL_ECC_LANE3", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_VERSION_3_0", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VALUE_TYPE_UNSIGNED_LONG_LONG", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_P2P_STATUS_DISABLED_BY_REGKEY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_POWER_PROFILE_LLM_INFERENCE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_SM_OCCUPANCY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DEVICE_PCI_BUS_ID_LEGACY_FMT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlClocksThrottleReasonHwPowerBrakeSlowdown", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlVgpuSchedulerSetParams_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlVgpuSchedulerSetParams_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PSTATE_14", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_FABRIC_STATE_COMPLETED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlEventTypeDramRetirementEvent", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetComputeRunningProcesses_v2", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceWorkloadPowerProfileGetCurrentProfiles", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlEventTypeFatalPoisonError", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_CLOCK_ID_APP_CLOCK_DEFAULT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetComputeRunningProcesses_v3", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_BRAND_NVIDIA_RTX", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_MODULE_POWER_SAMPLES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_COUNTER_PKTFILTER_FLUSH", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_TOPOLOGY_SINGLE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlDevicePerfModes_v1_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlDevicePerfModes_v1_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetSupportedEventTypes", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_IS_MIG_MODE_INDEPENDENT_MIG_QUERY_CAPABLE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlGpuInstanceGetComputeInstanceProfileInfo", "n_typed": 0, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVOFA_1_UTIL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_FABRIC_HEALTH_MASK_SHIFT_ROUTE_RECOVERY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuInstanceGetRuntimeStateSize", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_RCV_ERRORS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetConfComputeMemSizeInfo", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetVgpuInstancesUtilizationInfo", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlWorkloadPowerProfileProfilesInfo_v1_t", "methods": [ { "kind": "function", "name": "c_nvmlWorkloadPowerProfileProfilesInfo_v1_t.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlWorkloadPowerProfileProfilesInfo_v1_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlLedState_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlLedState_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C1_L9", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetGpuInstanceProfileInfo", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DEVICE_VGPU_CAP_COMPUTE_MEDIA_ENGINE_GPU", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_MEMORY_TEMP", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_ECC_DATA_ERROR_COUNT_L3", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PSTATE_11", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuInstanceGetFbUsage", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_REPLAY_ERROR_COUNT_L7", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GRID_LICENSE_EXPIRY_PERMANENT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VGPU_VM_COMPATIBILITY_COLD", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_ADAPTIVE_CLOCKING_INFO_STATUS_ENABLED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_ERROR_DEPRECATED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_PWR_SMOOTHING_HW_CIRCUITRY_PERCENT_LIFETIME_REMAINING", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_FP16_UTIL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_FLIT_ERROR_COUNT_L2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_ERROR_NOT_SUPPORTED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_SUPPORT_VERSION", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetHandleByIndex", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlVgpuPlacementList_v1_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlVgpuPlacementList_v1_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_PWR_SMOOTHING_PRIV_LVL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_FABRIC_HEALTH_MASK_SHIFT_DEGRADED_BW", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetGpuOperationMode", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_INFOROM_OEM", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_INIT_FLAG_NO_ATTACH", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_ECC_PENDING", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.VgpuRuntimeState_v1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetTemperatureV1", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_TEMPERATURE_THRESHOLD_SLOWDOWN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetThermalSettings", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_THERMAL_TARGET_ALL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlVgpuSchedulerGetState_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlVgpuSchedulerGetState_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetBusType", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceSetGpuLockedClocks", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_IS_RESETLESS_MIG_SUPPORTED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlSystemGetDriverBranch", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlGetVgpuDriverCapabilities", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlGpuInstanceGetComputeInstancePossiblePlacements", "n_typed": 0, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlNvlinkSupportedBwModes_v1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuInstanceGetPlacementId", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuInstanceGetEncoderStats", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlComputeInstanceGetInfo", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlClocksEventReasonHwThermalSlowdown", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VGPU_SCHEDULER_POLICY_FIXED_SHARE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DEVICE_ARCH_UNKNOWN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.NVMLLibraryMismatchError", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C1_L8", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetCurrentClockFreqs", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetClockOffsets", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VGPU_COMPATIBILITY_LIMIT_NONE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_REPLAY_ERROR_COUNT_L4", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_BRAND_TESLA", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FAN_NORMAL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_THERMAL_CONTROLLER_MAX6649", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlEventTypeDoubleBitEccError", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_POWER_PROFILE_MAX_Q", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceSetAccountingMode", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_CAP_SLI_BRIDGE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_TEMPERATURE_GPU_MAX_TLIMIT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PERF_MODES_BUFFER_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlSystemGetConfComputeKeyRotationThresholdInfo", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetNumaNodeId", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_THERMAL_CONTROLLER_OS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_INSTANCE_PROFILE_2_SLICE_REV1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlEventTypePowerSourceChange", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PROCESSOR_CLK_SAMPLES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_CLOCK_ID_CUSTOMER_BOOST_MAX", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetLastBBXFlushTime", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_POWER_SMOOTHING_PROFILE_PARAM_RAMP_DOWN_HYSTERESIS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.struct_c_nvmlComputeInstance_t", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlC2cModeInfo_v1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_MAX_PHYSICAL_BRIDGE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DEVICE_MIG_DISABLE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_POWER_CURRENT_LIMIT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlClocksThrottleReasonDisplayClockSetting", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PSTATE_8", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L3_TX_PER_SEC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetMarginTemperature", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetCurrentGpuOperationMode", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.SystemDriverBranchInfo_v1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetC2cModeInfoV1", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetVirtualizationMode", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlClocksEventReasonSwThermalSlowdown", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_FEC_HISTORY_6", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_CC_SYSTEM_MULTIGPU_PROTECTED_PCIE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVDEC_7_UTIL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetUtilizationRates", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetDramEncryptionMode", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetCurrentClocksEventReasons", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C0_L9", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_SCHEDULER_SW_MAX_LOG_ENTRIES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_POWER_DEFAULT_LIMIT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetModuleId", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetCurrentClocksThrottleReasons", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_THERMAL_CONTROLLER_ADT7473", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetCpuAffinity", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_FEC_HISTORY_5", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlGpuInstanceGetComputeInstanceById", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_REMAPPED_COR", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlFanSpeedInfo_v1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_FEC_HISTORY_10", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FBC_SESSION_TYPE_VID", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetSupportedVgpus", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DEVICE_ARCH_PASCAL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetPendingDriverModel", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetGpuFabricInfoV", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlClocksEventReasonNone", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetCount", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlBAR1Memory_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlBAR1Memory_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "c_nvmlBAR1Memory_t._fmt_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_PCIE_TX_PER_SEC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VGPU_VM_COMPATIBILITY_HIBERNATE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_PWR_SMOOTHING_PROFILE_RAMP_DOWN_HYST_VAL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVJPG_3_UTIL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlGpuInstanceCreateComputeInstanceWithPlacement", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlExceptionClass", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_VIRTUALIZATION_MODE_VGPU", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_POWER_PROFILE_BALANCED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetAttributes_v2", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetEncoderSessions", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.third_party.pynvml.NVMLError", "methods": [ { "kind": "function", "name": "NVMLError.__new__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NVMLError.__str__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NVMLError.__eq__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "NVMLError._valClassMapping", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NVMLError._errcode_to_string", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 6, "n_typed": 0, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 2, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlGridLicensableFeatures_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlGridLicensableFeatures_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlEccSramErrorStatus_v1_t", "methods": [ { "kind": "function", "name": "c_nvmlEccSramErrorStatus_v1_t.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlEccSramErrorStatus_v1_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_COUNTER_PKTFILTER_RESPDATA", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_THERMAL_TARGET_POWER_SUPPLY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DEVICE_NAME_V2_BUFFER_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_ECC_DBE_AGG_L1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_RECOVERY_ERROR_COUNT_L8", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceSetVgpuCapabilities", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlStructToFriendlyObject", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_CC_ACCEPTING_CLIENT_REQUESTS_FALSE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlComputeInstancePlacement_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlComputeInstancePlacement_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_MALFORMED_PACKET_ERRORS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_CC_SYSTEM_FEATURE_ENABLED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DEVICE_INFOROM_VERSION_BUFFER_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VGPU_INSTANCE_GUEST_INFO_STATE_INITIALIZED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_SPEED_MBPS_L0", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_GET_GPU_RECOVERY_ACTION", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DEVICE_VGPU_CAP_WARM_UPDATE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceSetCpuAffinity", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_VERSION_1_0", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.VgpuPlacementId_v1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_FABRIC_STATE_NOT_STARTED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_FABRIC_HEALTH_MASK_DEGRADED_BW_FALSE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlConfComputeGpuAttestationReport_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlConfComputeGpuAttestationReport_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_RECOVERY_ACTION_DRAIN_AND_RESET", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetBridgeChipInfo", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_FABRIC_HEALTH_MASK_SHIFT_ROUTE_UNHEALTHY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PCIE_ATOMICS_CAP_SWAP64", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlGpuInstanceProfileInfo_v2_t", "methods": [ { "kind": "function", "name": "c_nvmlGpuInstanceProfileInfo_v2_t.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlGpuInstanceProfileInfo_v2_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PSTATE_13", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceSetConfComputeUnprotectedMemSize", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PERF_POLICY_TOTAL_APP_CLOCKS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.VgpuPlacementList_v2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FAN_POLICY_TEMPERATURE_CONTINOUS_SW", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_GET_POWER_THRESHOLD_MIN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlGpmMigSampleGet", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_ERROR_INVALID_ARGUMENT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlGpuInstanceProfileInfo_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlGpuInstanceProfileInfo_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_SM_UTIL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetEncoderUtilization", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlGpuDynamicPstatesInfo_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlGpuDynamicPstatesInfo_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_AFFINITY_SCOPE_SOCKET", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_LINK_RECOVERY_SUCCESSFUL_EVENTS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_ERROR_MEMORY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_ERROR_INVALID_STATE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlGpuInstanceInfo_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlGpuInstanceInfo_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetHandleByPciBusId", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_SPEED_MBPS_COMMON", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GRID_LICENSE_FEATURE_CODE_VWORKSTATION", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_COMPUTEMODE_DEFAULT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuTypeGetClass", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_COUNTER_UNIT_COUNT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C1_L1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PSTATE_UNKNOWN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_MAX", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuInstanceGetLicenseInfo_v2", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_POWER_MIN_LIMIT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PAGE_RETIREMENT_CAUSE_MULTIPLE_SINGLE_BIT_ECC_ERRORS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetVgpuSchedulerState", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetTotalEnergyConsumption", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PSTATE_5", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_ECC_DATA_ERROR_COUNT_L1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_COUNTER_PKTFILTER_ALL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_ENCODER_QUERY_AV1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlProcessUtilizationInfo_v1_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlProcessUtilizationInfo_v1_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VGPU_SCHEDULER_POLICY_BEST_EFFORT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DEVICE_PCI_BUS_ID_BUFFER_V2_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_TEMPERATURE_THRESHOLD_GPU_MAX", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_LOW_POWER_THRESHOLD_UNIT_100US", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceWorkloadPowerProfileClearRequestedProfiles", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_CC_SYSTEM_GPUS_CC_CAPABLE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_AGGREGATE_ECC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_FABRIC_HEALTH_MASK_ACCESS_TIMEOUT_RECOVERY_TRUE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_ERROR_UNINITIALIZED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_metricInfo_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_metricInfo_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GRID_LICENSE_STATE_UNLICENSED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuInstanceGetMdevUUID", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_ECC_SBE_VOL_TEX", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetNumGpuCores", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FEATURE_ENABLED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlClocksThrottleReasonApplicationsClocksSetting", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceSetNvlinkBwMode", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_REPLAY_ERROR_COUNT_L3", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_ECC_SBE_VOL_L2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlVgpuSchedSetDataWithARR_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlVgpuSchedSetDataWithARR_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_SPEED_MBPS_L8", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VGPU_NAME_BUFFER_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VALUE_TYPE_DOUBLE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_PCIE_COUNT_RX_BYTES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVJPG_0_UTIL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_ERROR_DL_ECC_LANE0", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PCIE_LINK_MAX_SPEED_5000MBPS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PSTATE_15", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_COUNTER_PKTFILTER_NRATOM", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlInit", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_ECC_CURRENT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_COUNTER_UNIT_CYCLES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetEncoderCapacity", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GRID_LICENSE_STATE_LICENSED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_VERSION_INVALID", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceResetNvLinkUtilizationCounter", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_LINK_RECOVERY_FAILED_EVENTS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DEVICE_VGPU_CAP_FRACTIONAL_MULTI_VGPU", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetTemperatureV", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_VERSION_2_2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_RECOVERY_ERROR_COUNT_L7", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_VGPU_CAP_EXCLUSIVE_TYPE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVJPG_1_UTIL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlMemory_v2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_PWR_SMOOTHING_APPLIED_TMP_FLOOR", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_FLIT_ERROR_COUNT_TOTAL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_NVLINK_POWER_STATE_LOW", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlDramEncryptionInfo_t", "methods": [ { "kind": "function", "name": "c_nvmlDramEncryptionInfo_t.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlDramEncryptionInfo_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_TOPOLOGY_MULTIPLE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L15_TX_PER_SEC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L6_RX_PER_SEC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuInstanceGetAccountingStats", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_ECC_SBE_AGG_REG", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPU_NVLINK_BW_MODE_MIN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlVgpuMetadata_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlVgpuMetadata_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_LED_COLOR_GREEN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlGridLicensableFeatures_v2_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlGridLicensableFeatures_v2_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuTypeGetBAR1Info", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_PAGE_RETIREMENT_CAUSE_COUNT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetSramEccErrorStatus", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L0_TX_PER_SEC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_ECC_DATA_ERROR_COUNT_L9", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L5_TX_PER_SEC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetIndex", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlEccSramErrorStatus_v1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_THERMAL_CONTROLLER_SBMAX6649", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetPowerManagementLimit", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_COMPUTE_INSTANCE_PROFILE_4_SLICE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlEventTypeNone", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_FLIT_ERROR_COUNT_L10", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlProcessDetail_v1_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlProcessDetail_v1_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_CLOCK_LIMIT_ID_TDP", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlInitWithFlags", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_RAW_BER_LANE1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_FLIT_ERROR_COUNT_L3", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlVgpuTypeGetResolution", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_THERMAL_COOLER_TARGET_MEMORY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_TEMPERATURE_THRESHOLD_ACOUSTIC_CURR", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_MEMORY_LOCATION_COUNT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.pynvml.c_nvmlVgpuHeterogeneousMode_v1_t", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "c_nvmlVgpuHeterogeneousMode_v1_t._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlUnitGetPsuInfo", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.nvmlClockOffset_v1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlComputeInstanceGetInfo_v2", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_DATA_ERROR_COUNT_L2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_BRAND_COUNT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetGpuInstances", "n_typed": 0, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_PCIE_COUNT_BAD_DLLP", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L1_TX_PER_SEC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_FLIT_ERROR_COUNT_L9", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_GET_POWER_THRESHOLD_MAX", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_DEVICE_PCI_BUS_ID_BUFFER_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetPcieSpeed", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_RECOVERY_ERROR_COUNT_L1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_LOCAL_LINK_INTEGRITY_ERRORS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_POWER_SMOOTHING_PROFILE_PARAM_PERCENT_TMP_FLOOR", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.pynvml.NVML_MEMORY_LOCATION_L1_CACHE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.pynvml.nvmlDeviceGetVgpuCapabilities", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.third_party.pynvml", "names": [ "vllm.third_party.pynvml.ConfComputeGetKeyRotationThresholdInfo_v1", "vllm.third_party.pynvml.ConfComputeSetKeyRotationThresholdInfo_v1", "vllm.third_party.pynvml.MAX_CLK_DOMAINS", "vllm.third_party.pynvml.NVMLError", "vllm.third_party.pynvml.NVMLLibraryMismatchError", "vllm.third_party.pynvml.NVML_ADAPTIVE_CLOCKING_INFO_STATUS_DISABLED", "vllm.third_party.pynvml.NVML_ADAPTIVE_CLOCKING_INFO_STATUS_ENABLED", "vllm.third_party.pynvml.NVML_AFFINITY_SCOPE_NODE", "vllm.third_party.pynvml.NVML_AFFINITY_SCOPE_SOCKET", "vllm.third_party.pynvml.NVML_AGGREGATE_ECC", "vllm.third_party.pynvml.NVML_BRAND_COUNT", "vllm.third_party.pynvml.NVML_BRAND_GEFORCE", "vllm.third_party.pynvml.NVML_BRAND_GEFORCE_RTX", "vllm.third_party.pynvml.NVML_BRAND_GRID", "vllm.third_party.pynvml.NVML_BRAND_NVIDIA", "vllm.third_party.pynvml.NVML_BRAND_NVIDIA_CLOUD_GAMING", "vllm.third_party.pynvml.NVML_BRAND_NVIDIA_RTX", "vllm.third_party.pynvml.NVML_BRAND_NVIDIA_VAPPS", "vllm.third_party.pynvml.NVML_BRAND_NVIDIA_VCS", "vllm.third_party.pynvml.NVML_BRAND_NVIDIA_VPC", "vllm.third_party.pynvml.NVML_BRAND_NVIDIA_VWS", "vllm.third_party.pynvml.NVML_BRAND_NVS", "vllm.third_party.pynvml.NVML_BRAND_QUADRO", "vllm.third_party.pynvml.NVML_BRAND_QUADRO_RTX", "vllm.third_party.pynvml.NVML_BRAND_TESLA", "vllm.third_party.pynvml.NVML_BRAND_TITAN", "vllm.third_party.pynvml.NVML_BRAND_TITAN_RTX", "vllm.third_party.pynvml.NVML_BRAND_UNKNOWN", "vllm.third_party.pynvml.NVML_BRIDGE_CHIP_BRO4", "vllm.third_party.pynvml.NVML_BRIDGE_CHIP_PLX", "vllm.third_party.pynvml.NVML_BUS_TYPE_AGP", "vllm.third_party.pynvml.NVML_BUS_TYPE_FPCI", "vllm.third_party.pynvml.NVML_BUS_TYPE_PCI", "vllm.third_party.pynvml.NVML_BUS_TYPE_PCIE", "vllm.third_party.pynvml.NVML_BUS_TYPE_UNKNOWN", "vllm.third_party.pynvml.NVML_CC_ACCEPTING_CLIENT_REQUESTS_FALSE", "vllm.third_party.pynvml.NVML_CC_ACCEPTING_CLIENT_REQUESTS_TRUE", "vllm.third_party.pynvml.NVML_CC_CEC_ATTESTATION_REPORT_NOT_PRESENT", "vllm.third_party.pynvml.NVML_CC_CEC_ATTESTATION_REPORT_PRESENT", "vllm.third_party.pynvml.NVML_CC_GPU_ATTESTATION_REPORT_SIZE", "vllm.third_party.pynvml.NVML_CC_GPU_CEC_ATTESTATION_REPORT_SIZE", "vllm.third_party.pynvml.NVML_CC_GPU_CEC_NONCE_SIZE", "vllm.third_party.pynvml.NVML_CC_KEY_ROTATION_THRESH_ATTACKER_ADVANTAGE_MAX", "vllm.third_party.pynvml.NVML_CC_KEY_ROTATION_THRESH_ATTACKER_ADVANTAGE_MIN", "vllm.third_party.pynvml.NVML_CC_SYSTEM_CPU_CAPS_AMD_SEV", "vllm.third_party.pynvml.NVML_CC_SYSTEM_CPU_CAPS_AMD_SEV_SNP", "vllm.third_party.pynvml.NVML_CC_SYSTEM_CPU_CAPS_AMD_SNP_VTOM", "vllm.third_party.pynvml.NVML_CC_SYSTEM_CPU_CAPS_INTEL_TDX", "vllm.third_party.pynvml.NVML_CC_SYSTEM_CPU_CAPS_NONE", "vllm.third_party.pynvml.NVML_CC_SYSTEM_DEVTOOLS_MODE_OFF", "vllm.third_party.pynvml.NVML_CC_SYSTEM_DEVTOOLS_MODE_ON", "vllm.third_party.pynvml.NVML_CC_SYSTEM_ENVIRONMENT_PROD", "vllm.third_party.pynvml.NVML_CC_SYSTEM_ENVIRONMENT_SIM", "vllm.third_party.pynvml.NVML_CC_SYSTEM_ENVIRONMENT_UNAVAILABLE", "vllm.third_party.pynvml.NVML_CC_SYSTEM_FEATURE_DISABLED", "vllm.third_party.pynvml.NVML_CC_SYSTEM_FEATURE_ENABLED", "vllm.third_party.pynvml.NVML_CC_SYSTEM_GPUS_CC_CAPABLE", "vllm.third_party.pynvml.NVML_CC_SYSTEM_GPUS_CC_NOT_CAPABLE", "vllm.third_party.pynvml.NVML_CC_SYSTEM_MULTIGPU_NONE", "vllm.third_party.pynvml.NVML_CC_SYSTEM_MULTIGPU_PROTECTED_PCIE", "vllm.third_party.pynvml.NVML_CLOCK_COUNT", "vllm.third_party.pynvml.NVML_CLOCK_GRAPHICS", "vllm.third_party.pynvml.NVML_CLOCK_ID_APP_CLOCK_DEFAULT", "vllm.third_party.pynvml.NVML_CLOCK_ID_APP_CLOCK_TARGET", "vllm.third_party.pynvml.NVML_CLOCK_ID_COUNT", "vllm.third_party.pynvml.NVML_CLOCK_ID_CURRENT", "vllm.third_party.pynvml.NVML_CLOCK_ID_CUSTOMER_BOOST_MAX", "vllm.third_party.pynvml.NVML_CLOCK_LIMIT_ID_RANGE_START", "vllm.third_party.pynvml.NVML_CLOCK_LIMIT_ID_TDP", "vllm.third_party.pynvml.NVML_CLOCK_LIMIT_ID_UNLIMITED", "vllm.third_party.pynvml.NVML_CLOCK_MEM", "vllm.third_party.pynvml.NVML_CLOCK_SM", "vllm.third_party.pynvml.NVML_CLOCK_VIDEO", "vllm.third_party.pynvml.NVML_COMPUTEMODE_COUNT", "vllm.third_party.pynvml.NVML_COMPUTEMODE_DEFAULT", "vllm.third_party.pynvml.NVML_COMPUTEMODE_EXCLUSIVE_PROCESS", "vllm.third_party.pynvml.NVML_COMPUTEMODE_EXCLUSIVE_THREAD", "vllm.third_party.pynvml.NVML_COMPUTEMODE_PROHIBITED", "vllm.third_party.pynvml.NVML_COMPUTE_INSTANCE_ENGINE_PROFILE_COUNT", "vllm.third_party.pynvml.NVML_COMPUTE_INSTANCE_ENGINE_PROFILE_SHARED", "vllm.third_party.pynvml.NVML_COMPUTE_INSTANCE_PROFILE_1_SLICE", "vllm.third_party.pynvml.NVML_COMPUTE_INSTANCE_PROFILE_1_SLICE_REV1", "vllm.third_party.pynvml.NVML_COMPUTE_INSTANCE_PROFILE_2_SLICE", "vllm.third_party.pynvml.NVML_COMPUTE_INSTANCE_PROFILE_3_SLICE", "vllm.third_party.pynvml.NVML_COMPUTE_INSTANCE_PROFILE_4_SLICE", "vllm.third_party.pynvml.NVML_COMPUTE_INSTANCE_PROFILE_6_SLICE", "vllm.third_party.pynvml.NVML_COMPUTE_INSTANCE_PROFILE_7_SLICE", "vllm.third_party.pynvml.NVML_COMPUTE_INSTANCE_PROFILE_8_SLICE", "vllm.third_party.pynvml.NVML_COMPUTE_INSTANCE_PROFILE_COUNT", "vllm.third_party.pynvml.NVML_DEC_UTILIZATION_SAMPLES", "vllm.third_party.pynvml.NVML_DETACH_GPU_KEEP", "vllm.third_party.pynvml.NVML_DETACH_GPU_REMOVE", "vllm.third_party.pynvml.NVML_DEVICE_ARCH_ADA", "vllm.third_party.pynvml.NVML_DEVICE_ARCH_AMPERE", "vllm.third_party.pynvml.NVML_DEVICE_ARCH_BLACKWELL", "vllm.third_party.pynvml.NVML_DEVICE_ARCH_HOPPER", "vllm.third_party.pynvml.NVML_DEVICE_ARCH_KEPLER", "vllm.third_party.pynvml.NVML_DEVICE_ARCH_MAXWELL", "vllm.third_party.pynvml.NVML_DEVICE_ARCH_PASCAL", "vllm.third_party.pynvml.NVML_DEVICE_ARCH_T23X", "vllm.third_party.pynvml.NVML_DEVICE_ARCH_TURING", "vllm.third_party.pynvml.NVML_DEVICE_ARCH_UNKNOWN", "vllm.third_party.pynvml.NVML_DEVICE_ARCH_VOLTA", "vllm.third_party.pynvml.NVML_DEVICE_GPU_FRU_PART_NUMBER_BUFFER_SIZE", "vllm.third_party.pynvml.NVML_DEVICE_GPU_PART_NUMBER_BUFFER_SIZE", "vllm.third_party.pynvml.NVML_DEVICE_INFOROM_VERSION_BUFFER_SIZE", "vllm.third_party.pynvml.NVML_DEVICE_MIG_DISABLE", "vllm.third_party.pynvml.NVML_DEVICE_MIG_ENABLE", "vllm.third_party.pynvml.NVML_DEVICE_NAME_BUFFER_SIZE", "vllm.third_party.pynvml.NVML_DEVICE_NAME_V2_BUFFER_SIZE", "vllm.third_party.pynvml.NVML_DEVICE_PART_NUMBER_BUFFER_SIZE", "vllm.third_party.pynvml.NVML_DEVICE_PCI_BUS_ID_BUFFER_SIZE", "vllm.third_party.pynvml.NVML_DEVICE_PCI_BUS_ID_BUFFER_V2_SIZE", "vllm.third_party.pynvml.NVML_DEVICE_PCI_BUS_ID_FMT", "vllm.third_party.pynvml.NVML_DEVICE_PCI_BUS_ID_LEGACY_FMT", "vllm.third_party.pynvml.NVML_DEVICE_SERIAL_BUFFER_SIZE", "vllm.third_party.pynvml.NVML_DEVICE_UUID_BUFFER_SIZE", "vllm.third_party.pynvml.NVML_DEVICE_UUID_V2_BUFFER_SIZE", "vllm.third_party.pynvml.NVML_DEVICE_VBIOS_VERSION_BUFFER_SIZE", "vllm.third_party.pynvml.NVML_DEVICE_VGPU_CAP_COMPUTE_MEDIA_ENGINE_GPU", "vllm.third_party.pynvml.NVML_DEVICE_VGPU_CAP_COUNT", "vllm.third_party.pynvml.NVML_DEVICE_VGPU_CAP_DEVICE_STREAMING", "vllm.third_party.pynvml.NVML_DEVICE_VGPU_CAP_FRACTIONAL_MULTI_VGPU", "vllm.third_party.pynvml.NVML_DEVICE_VGPU_CAP_HETEROGENEOUS_TIMESLICE_PROFILES", "vllm.third_party.pynvml.NVML_DEVICE_VGPU_CAP_HETEROGENEOUS_TIMESLICE_SIZES", "vllm.third_party.pynvml.NVML_DEVICE_VGPU_CAP_HOMOGENEOUS_PLACEMENTS", "vllm.third_party.pynvml.NVML_DEVICE_VGPU_CAP_MINI_QUARTER_GPU", "vllm.third_party.pynvml.NVML_DEVICE_VGPU_CAP_READ_DEVICE_BUFFER_BW", "vllm.third_party.pynvml.NVML_DEVICE_VGPU_CAP_WARM_UPDATE", "vllm.third_party.pynvml.NVML_DEVICE_VGPU_CAP_WRITE_DEVICE_BUFFER_BW", "vllm.third_party.pynvml.NVML_DEV_CAP_EGM", "vllm.third_party.pynvml.NVML_DOUBLE_BIT_ECC", "vllm.third_party.pynvml.NVML_DRIVER_MCDM", "vllm.third_party.pynvml.NVML_DRIVER_WDDM", "vllm.third_party.pynvml.NVML_DRIVER_WDM", "vllm.third_party.pynvml.NVML_ECC_COUNTER_TYPE_COUNT", "vllm.third_party.pynvml.NVML_ECC_ERROR_TYPE_COUNT", "vllm.third_party.pynvml.NVML_ENCODER_QUERY_AV1", "vllm.third_party.pynvml.NVML_ENCODER_QUERY_H264", "vllm.third_party.pynvml.NVML_ENCODER_QUERY_HEVC", "vllm.third_party.pynvml.NVML_ENCODER_QUERY_UNKNOWN", "vllm.third_party.pynvml.NVML_ENC_UTILIZATION_SAMPLES", "vllm.third_party.pynvml.NVML_ERROR_ALREADY_INITIALIZED", "vllm.third_party.pynvml.NVML_ERROR_ARGUMENT_VERSION_MISMATCH", "vllm.third_party.pynvml.NVML_ERROR_CORRUPTED_INFOROM", "vllm.third_party.pynvml.NVML_ERROR_DEPRECATED", "vllm.third_party.pynvml.NVML_ERROR_DRIVER_NOT_LOADED", "vllm.third_party.pynvml.NVML_ERROR_FREQ_NOT_SUPPORTED", "vllm.third_party.pynvml.NVML_ERROR_FUNCTION_NOT_FOUND", "vllm.third_party.pynvml.NVML_ERROR_GPU_IS_LOST", "vllm.third_party.pynvml.NVML_ERROR_GPU_NOT_FOUND", "vllm.third_party.pynvml.NVML_ERROR_INSUFFICIENT_POWER", "vllm.third_party.pynvml.NVML_ERROR_INSUFFICIENT_RESOURCES", "vllm.third_party.pynvml.NVML_ERROR_INSUFFICIENT_SIZE", "vllm.third_party.pynvml.NVML_ERROR_INVALID_ARGUMENT", "vllm.third_party.pynvml.NVML_ERROR_INVALID_STATE", "vllm.third_party.pynvml.NVML_ERROR_IN_USE", "vllm.third_party.pynvml.NVML_ERROR_IRQ_ISSUE", "vllm.third_party.pynvml.NVML_ERROR_LIBRARY_NOT_FOUND", "vllm.third_party.pynvml.NVML_ERROR_LIB_RM_VERSION_MISMATCH", "vllm.third_party.pynvml.NVML_ERROR_MEMORY", "vllm.third_party.pynvml.NVML_ERROR_NOT_FOUND", "vllm.third_party.pynvml.NVML_ERROR_NOT_READY", "vllm.third_party.pynvml.NVML_ERROR_NOT_SUPPORTED", "vllm.third_party.pynvml.NVML_ERROR_NO_DATA", "vllm.third_party.pynvml.NVML_ERROR_NO_PERMISSION", "vllm.third_party.pynvml.NVML_ERROR_OPERATING_SYSTEM", "vllm.third_party.pynvml.NVML_ERROR_RESET_REQUIRED", "vllm.third_party.pynvml.NVML_ERROR_TIMEOUT", "vllm.third_party.pynvml.NVML_ERROR_UNINITIALIZED", "vllm.third_party.pynvml.NVML_ERROR_UNKNOWN", "vllm.third_party.pynvml.NVML_ERROR_VGPU_ECC_NOT_SUPPORTED", "vllm.third_party.pynvml.NVML_FAN_FAILED", "vllm.third_party.pynvml.NVML_FAN_NORMAL", "vllm.third_party.pynvml.NVML_FAN_POLICY_MANUAL", "vllm.third_party.pynvml.NVML_FAN_POLICY_TEMPERATURE_CONTINOUS_SW", "vllm.third_party.pynvml.NVML_FBC_SESSION_TYPE_CUDA", "vllm.third_party.pynvml.NVML_FBC_SESSION_TYPE_HWENC", "vllm.third_party.pynvml.NVML_FBC_SESSION_TYPE_TOSYS", "vllm.third_party.pynvml.NVML_FBC_SESSION_TYPE_UNKNOWN", "vllm.third_party.pynvml.NVML_FBC_SESSION_TYPE_VID", "vllm.third_party.pynvml.NVML_FEATURE_DISABLED", "vllm.third_party.pynvml.NVML_FEATURE_ENABLED", "vllm.third_party.pynvml.NVML_FI_DEV_C2C_LINK_COUNT", "vllm.third_party.pynvml.NVML_FI_DEV_C2C_LINK_GET_MAX_BW", "vllm.third_party.pynvml.NVML_FI_DEV_C2C_LINK_GET_STATUS", "vllm.third_party.pynvml.NVML_FI_DEV_DRAIN_AND_RESET_STATUS", "vllm.third_party.pynvml.NVML_FI_DEV_ECC_CURRENT", "vllm.third_party.pynvml.NVML_FI_DEV_ECC_DBE_AGG_CBU", "vllm.third_party.pynvml.NVML_FI_DEV_ECC_DBE_AGG_DEV", "vllm.third_party.pynvml.NVML_FI_DEV_ECC_DBE_AGG_L1", "vllm.third_party.pynvml.NVML_FI_DEV_ECC_DBE_AGG_L2", "vllm.third_party.pynvml.NVML_FI_DEV_ECC_DBE_AGG_REG", "vllm.third_party.pynvml.NVML_FI_DEV_ECC_DBE_AGG_TEX", "vllm.third_party.pynvml.NVML_FI_DEV_ECC_DBE_AGG_TOTAL", "vllm.third_party.pynvml.NVML_FI_DEV_ECC_DBE_VOL_CBU", "vllm.third_party.pynvml.NVML_FI_DEV_ECC_DBE_VOL_DEV", "vllm.third_party.pynvml.NVML_FI_DEV_ECC_DBE_VOL_L1", "vllm.third_party.pynvml.NVML_FI_DEV_ECC_DBE_VOL_L2", "vllm.third_party.pynvml.NVML_FI_DEV_ECC_DBE_VOL_REG", "vllm.third_party.pynvml.NVML_FI_DEV_ECC_DBE_VOL_TEX", "vllm.third_party.pynvml.NVML_FI_DEV_ECC_DBE_VOL_TOTAL", "vllm.third_party.pynvml.NVML_FI_DEV_ECC_PENDING", "vllm.third_party.pynvml.NVML_FI_DEV_ECC_SBE_AGG_DEV", "vllm.third_party.pynvml.NVML_FI_DEV_ECC_SBE_AGG_L1", "vllm.third_party.pynvml.NVML_FI_DEV_ECC_SBE_AGG_L2", "vllm.third_party.pynvml.NVML_FI_DEV_ECC_SBE_AGG_REG", "vllm.third_party.pynvml.NVML_FI_DEV_ECC_SBE_AGG_TEX", "vllm.third_party.pynvml.NVML_FI_DEV_ECC_SBE_AGG_TOTAL", "vllm.third_party.pynvml.NVML_FI_DEV_ECC_SBE_VOL_DEV", "vllm.third_party.pynvml.NVML_FI_DEV_ECC_SBE_VOL_L1", "vllm.third_party.pynvml.NVML_FI_DEV_ECC_SBE_VOL_L2", "vllm.third_party.pynvml.NVML_FI_DEV_ECC_SBE_VOL_REG", "vllm.third_party.pynvml.NVML_FI_DEV_ECC_SBE_VOL_TEX", "vllm.third_party.pynvml.NVML_FI_DEV_ECC_SBE_VOL_TOTAL", "vllm.third_party.pynvml.NVML_FI_DEV_ENERGY", "vllm.third_party.pynvml.NVML_FI_DEV_GET_GPU_RECOVERY_ACTION", "vllm.third_party.pynvml.NVML_FI_DEV_IS_MIG_MODE_INDEPENDENT_MIG_QUERY_CAPABLE", "vllm.third_party.pynvml.NVML_FI_DEV_IS_RESETLESS_MIG_SUPPORTED", "vllm.third_party.pynvml.NVML_FI_DEV_MEMORY_TEMP", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C0_L0", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C0_L1", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C0_L10", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C0_L11", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C0_L2", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C0_L3", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C0_L4", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C0_L5", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C0_L6", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C0_L7", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C0_L8", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C0_L9", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C0_TOTAL", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C1_L0", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C1_L1", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C1_L10", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C1_L11", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C1_L2", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C1_L3", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C1_L4", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C1_L5", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C1_L6", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C1_L7", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C1_L8", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C1_L9", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_BANDWIDTH_C1_TOTAL", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_BUFFER_OVERRUN_ERRORS", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_EFFECTIVE_BER", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_EFFECTIVE_ERRORS", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_FEC_HISTORY_0", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_FEC_HISTORY_1", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_FEC_HISTORY_10", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_FEC_HISTORY_11", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_FEC_HISTORY_12", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_FEC_HISTORY_13", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_FEC_HISTORY_14", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_FEC_HISTORY_15", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_FEC_HISTORY_2", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_FEC_HISTORY_3", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_FEC_HISTORY_4", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_FEC_HISTORY_5", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_FEC_HISTORY_6", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_FEC_HISTORY_7", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_FEC_HISTORY_8", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_FEC_HISTORY_9", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_LINK_RECOVERY_EVENTS", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_LINK_RECOVERY_FAILED_EVENTS", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_LINK_RECOVERY_SUCCESSFUL_EVENTS", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_LOCAL_LINK_INTEGRITY_ERRORS", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_MALFORMED_PACKET_ERRORS", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_RAW_BER", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_RAW_BER_LANE0", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_RAW_BER_LANE1", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_RCV_BYTES", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_RCV_ERRORS", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_RCV_GENERAL_ERRORS", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_RCV_PACKETS", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_RCV_REMOTE_ERRORS", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_SYMBOL_BER", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_SYMBOL_ERRORS", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_VL15_DROPPED", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_XMIT_BYTES", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_XMIT_DISCARDS", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_COUNT_XMIT_PACKETS", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_DATA_ERROR_COUNT_L0", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_DATA_ERROR_COUNT_L1", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_DATA_ERROR_COUNT_L10", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_DATA_ERROR_COUNT_L11", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_DATA_ERROR_COUNT_L2", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_DATA_ERROR_COUNT_L3", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_DATA_ERROR_COUNT_L4", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_DATA_ERROR_COUNT_L5", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_DATA_ERROR_COUNT_L6", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_DATA_ERROR_COUNT_L7", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_DATA_ERROR_COUNT_L8", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_DATA_ERROR_COUNT_L9", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_DATA_ERROR_COUNT_TOTAL", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_FLIT_ERROR_COUNT_L0", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_FLIT_ERROR_COUNT_L1", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_FLIT_ERROR_COUNT_L10", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_FLIT_ERROR_COUNT_L11", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_FLIT_ERROR_COUNT_L2", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_FLIT_ERROR_COUNT_L3", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_FLIT_ERROR_COUNT_L4", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_FLIT_ERROR_COUNT_L5", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_FLIT_ERROR_COUNT_L6", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_FLIT_ERROR_COUNT_L7", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_FLIT_ERROR_COUNT_L8", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_FLIT_ERROR_COUNT_L9", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_CRC_FLIT_ERROR_COUNT_TOTAL", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_ECC_DATA_ERROR_COUNT_L0", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_ECC_DATA_ERROR_COUNT_L1", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_ECC_DATA_ERROR_COUNT_L10", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_ECC_DATA_ERROR_COUNT_L11", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_ECC_DATA_ERROR_COUNT_L2", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_ECC_DATA_ERROR_COUNT_L3", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_ECC_DATA_ERROR_COUNT_L4", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_ECC_DATA_ERROR_COUNT_L5", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_ECC_DATA_ERROR_COUNT_L6", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_ECC_DATA_ERROR_COUNT_L7", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_ECC_DATA_ERROR_COUNT_L8", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_ECC_DATA_ERROR_COUNT_L9", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_ECC_DATA_ERROR_COUNT_TOTAL", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_ERROR_DL_CRC", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_ERROR_DL_RECOVERY", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_ERROR_DL_REPLAY", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_GET_POWER_STATE", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_GET_POWER_THRESHOLD", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_GET_POWER_THRESHOLD_MAX", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_GET_POWER_THRESHOLD_MIN", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_GET_POWER_THRESHOLD_SUPPORTED", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_GET_POWER_THRESHOLD_UNITS", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_GET_SPEED", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_GET_STATE", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_GET_VERSION", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_LINK_COUNT", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_RECOVERY_ERROR_COUNT_L0", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_RECOVERY_ERROR_COUNT_L1", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_RECOVERY_ERROR_COUNT_L10", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_RECOVERY_ERROR_COUNT_L11", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_RECOVERY_ERROR_COUNT_L2", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_RECOVERY_ERROR_COUNT_L3", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_RECOVERY_ERROR_COUNT_L4", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_RECOVERY_ERROR_COUNT_L5", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_RECOVERY_ERROR_COUNT_L6", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_RECOVERY_ERROR_COUNT_L7", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_RECOVERY_ERROR_COUNT_L8", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_RECOVERY_ERROR_COUNT_L9", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_RECOVERY_ERROR_COUNT_TOTAL", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_REMOTE_NVLINK_ID", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_REPLAY_ERROR_COUNT_L0", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_REPLAY_ERROR_COUNT_L1", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_REPLAY_ERROR_COUNT_L10", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_REPLAY_ERROR_COUNT_L11", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_REPLAY_ERROR_COUNT_L2", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_REPLAY_ERROR_COUNT_L3", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_REPLAY_ERROR_COUNT_L4", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_REPLAY_ERROR_COUNT_L5", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_REPLAY_ERROR_COUNT_L6", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_REPLAY_ERROR_COUNT_L7", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_REPLAY_ERROR_COUNT_L8", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_REPLAY_ERROR_COUNT_L9", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_REPLAY_ERROR_COUNT_TOTAL", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_SPEED_MBPS_COMMON", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_SPEED_MBPS_L0", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_SPEED_MBPS_L1", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_SPEED_MBPS_L10", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_SPEED_MBPS_L11", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_SPEED_MBPS_L2", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_SPEED_MBPS_L3", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_SPEED_MBPS_L4", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_SPEED_MBPS_L5", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_SPEED_MBPS_L6", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_SPEED_MBPS_L7", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_SPEED_MBPS_L8", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_SPEED_MBPS_L9", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_THROUGHPUT_DATA_RX", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_THROUGHPUT_DATA_TX", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_THROUGHPUT_RAW_RX", "vllm.third_party.pynvml.NVML_FI_DEV_NVLINK_THROUGHPUT_RAW_TX", "vllm.third_party.pynvml.NVML_FI_DEV_NVSWITCH_CONNECTED_LINK_COUNT", "vllm.third_party.pynvml.NVML_FI_DEV_PCIE_COUNT_BAD_DLLP", "vllm.third_party.pynvml.NVML_FI_DEV_PCIE_COUNT_BAD_TLP", "vllm.third_party.pynvml.NVML_FI_DEV_PCIE_COUNT_CORRECTABLE_ERRORS", "vllm.third_party.pynvml.NVML_FI_DEV_PCIE_COUNT_FATAL_ERROR", "vllm.third_party.pynvml.NVML_FI_DEV_PCIE_COUNT_LANE_ERROR", "vllm.third_party.pynvml.NVML_FI_DEV_PCIE_COUNT_LCRC_ERROR", "vllm.third_party.pynvml.NVML_FI_DEV_PCIE_COUNT_NAKS_RECEIVED", "vllm.third_party.pynvml.NVML_FI_DEV_PCIE_COUNT_NAKS_SENT", "vllm.third_party.pynvml.NVML_FI_DEV_PCIE_COUNT_NON_FATAL_ERROR", "vllm.third_party.pynvml.NVML_FI_DEV_PCIE_COUNT_RECEIVER_ERROR", "vllm.third_party.pynvml.NVML_FI_DEV_PCIE_COUNT_RX_BYTES", "vllm.third_party.pynvml.NVML_FI_DEV_PCIE_COUNT_TX_BYTES", "vllm.third_party.pynvml.NVML_FI_DEV_PCIE_COUNT_UNSUPPORTED_REQ", "vllm.third_party.pynvml.NVML_FI_DEV_PCIE_INBOUND_ATOMICS_MASK", "vllm.third_party.pynvml.NVML_FI_DEV_PCIE_L0_TO_RECOVERY_COUNTER", "vllm.third_party.pynvml.NVML_FI_DEV_PCIE_OUTBOUND_ATOMICS_MASK", "vllm.third_party.pynvml.NVML_FI_DEV_PCIE_REPLAY_COUNTER", "vllm.third_party.pynvml.NVML_FI_DEV_PCIE_REPLAY_ROLLOVER_COUNTER", "vllm.third_party.pynvml.NVML_FI_DEV_PERF_POLICY_BOARD_LIMIT", "vllm.third_party.pynvml.NVML_FI_DEV_PERF_POLICY_LOW_UTILIZATION", "vllm.third_party.pynvml.NVML_FI_DEV_PERF_POLICY_POWER", "vllm.third_party.pynvml.NVML_FI_DEV_PERF_POLICY_RELIABILITY", "vllm.third_party.pynvml.NVML_FI_DEV_PERF_POLICY_SYNC_BOOST", "vllm.third_party.pynvml.NVML_FI_DEV_PERF_POLICY_THERMAL", "vllm.third_party.pynvml.NVML_FI_DEV_PERF_POLICY_TOTAL_APP_CLOCKS", "vllm.third_party.pynvml.NVML_FI_DEV_PERF_POLICY_TOTAL_BASE_CLOCKS", "vllm.third_party.pynvml.NVML_FI_DEV_POWER_AVERAGE", "vllm.third_party.pynvml.NVML_FI_DEV_POWER_CURRENT_LIMIT", "vllm.third_party.pynvml.NVML_FI_DEV_POWER_DEFAULT_LIMIT", "vllm.third_party.pynvml.NVML_FI_DEV_POWER_INSTANT", "vllm.third_party.pynvml.NVML_FI_DEV_POWER_MAX_LIMIT", "vllm.third_party.pynvml.NVML_FI_DEV_POWER_MIN_LIMIT", "vllm.third_party.pynvml.NVML_FI_DEV_POWER_REQUESTED_LIMIT", "vllm.third_party.pynvml.NVML_FI_DEV_REMAPPED_COR", "vllm.third_party.pynvml.NVML_FI_DEV_REMAPPED_FAILURE", "vllm.third_party.pynvml.NVML_FI_DEV_REMAPPED_PENDING", "vllm.third_party.pynvml.NVML_FI_DEV_REMAPPED_UNC", "vllm.third_party.pynvml.NVML_FI_DEV_RESET_STATUS", "vllm.third_party.pynvml.NVML_FI_DEV_RETIRED_DBE", "vllm.third_party.pynvml.NVML_FI_DEV_RETIRED_PENDING", "vllm.third_party.pynvml.NVML_FI_DEV_RETIRED_PENDING_DBE", "vllm.third_party.pynvml.NVML_FI_DEV_RETIRED_PENDING_SBE", "vllm.third_party.pynvml.NVML_FI_DEV_RETIRED_SBE", "vllm.third_party.pynvml.NVML_FI_DEV_TEMPERATURE_GPU_MAX_TLIMIT", "vllm.third_party.pynvml.NVML_FI_DEV_TEMPERATURE_MEM_MAX_TLIMIT", "vllm.third_party.pynvml.NVML_FI_DEV_TEMPERATURE_SHUTDOWN_TLIMIT", "vllm.third_party.pynvml.NVML_FI_DEV_TEMPERATURE_SLOWDOWN_TLIMIT", "vllm.third_party.pynvml.NVML_FI_DEV_TOTAL_ENERGY_CONSUMPTION", "vllm.third_party.pynvml.NVML_FI_MAX", "vllm.third_party.pynvml.NVML_FI_PWR_SMOOTHING_ACTIVE_PRESET_PROFILE", "vllm.third_party.pynvml.NVML_FI_PWR_SMOOTHING_ADMIN_OVERRIDE_PERCENT_TMP_FLOOR", "vllm.third_party.pynvml.NVML_FI_PWR_SMOOTHING_ADMIN_OVERRIDE_RAMP_DOWN_HYST_VAL", "vllm.third_party.pynvml.NVML_FI_PWR_SMOOTHING_ADMIN_OVERRIDE_RAMP_DOWN_RATE", "vllm.third_party.pynvml.NVML_FI_PWR_SMOOTHING_ADMIN_OVERRIDE_RAMP_UP_RATE", "vllm.third_party.pynvml.NVML_FI_PWR_SMOOTHING_APPLIED_TMP_CEIL", "vllm.third_party.pynvml.NVML_FI_PWR_SMOOTHING_APPLIED_TMP_FLOOR", "vllm.third_party.pynvml.NVML_FI_PWR_SMOOTHING_ENABLED", "vllm.third_party.pynvml.NVML_FI_PWR_SMOOTHING_HW_CIRCUITRY_PERCENT_LIFETIME_REMAINING", "vllm.third_party.pynvml.NVML_FI_PWR_SMOOTHING_IMM_RAMP_DOWN_ENABLED", "vllm.third_party.pynvml.NVML_FI_PWR_SMOOTHING_MAX_NUM_PRESET_PROFILES", "vllm.third_party.pynvml.NVML_FI_PWR_SMOOTHING_MAX_PERCENT_TMP_FLOOR_SETTING", "vllm.third_party.pynvml.NVML_FI_PWR_SMOOTHING_MIN_PERCENT_TMP_FLOOR_SETTING", "vllm.third_party.pynvml.NVML_FI_PWR_SMOOTHING_PRIV_LVL", "vllm.third_party.pynvml.NVML_FI_PWR_SMOOTHING_PROFILE_PERCENT_TMP_FLOOR", "vllm.third_party.pynvml.NVML_FI_PWR_SMOOTHING_PROFILE_RAMP_DOWN_HYST_VAL", "vllm.third_party.pynvml.NVML_FI_PWR_SMOOTHING_PROFILE_RAMP_DOWN_RATE", "vllm.third_party.pynvml.NVML_FI_PWR_SMOOTHING_PROFILE_RAMP_UP_RATE", "vllm.third_party.pynvml.NVML_GOM_ALL_ON", "vllm.third_party.pynvml.NVML_GOM_COMPUTE", "vllm.third_party.pynvml.NVML_GOM_LOW_DP", "vllm.third_party.pynvml.NVML_GPM_METRICS_GET_VERSION", "vllm.third_party.pynvml.NVML_GPM_METRIC_ANY_TENSOR_UTIL", "vllm.third_party.pynvml.NVML_GPM_METRIC_DFMA_TENSOR_UTIL", "vllm.third_party.pynvml.NVML_GPM_METRIC_DRAM_BW_UTIL", "vllm.third_party.pynvml.NVML_GPM_METRIC_FP16_UTIL", "vllm.third_party.pynvml.NVML_GPM_METRIC_FP32_UTIL", "vllm.third_party.pynvml.NVML_GPM_METRIC_FP64_UTIL", "vllm.third_party.pynvml.NVML_GPM_METRIC_GRAPHICS_UTIL", "vllm.third_party.pynvml.NVML_GPM_METRIC_HMMA_TENSOR_UTIL", "vllm.third_party.pynvml.NVML_GPM_METRIC_IMMA_TENSOR_UTIL", "vllm.third_party.pynvml.NVML_GPM_METRIC_INTEGER_UTIL", "vllm.third_party.pynvml.NVML_GPM_METRIC_MAX", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVDEC_0_UTIL", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVDEC_1_UTIL", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVDEC_2_UTIL", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVDEC_3_UTIL", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVDEC_4_UTIL", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVDEC_5_UTIL", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVDEC_6_UTIL", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVDEC_7_UTIL", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVJPG_0_UTIL", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVJPG_1_UTIL", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVJPG_2_UTIL", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVJPG_3_UTIL", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVJPG_4_UTIL", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVJPG_5_UTIL", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVJPG_6_UTIL", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVJPG_7_UTIL", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L0_RX_PER_SEC", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L0_TX_PER_SEC", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L10_RX_PER_SEC", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L10_TX_PER_SEC", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L11_RX_PER_SEC", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L11_TX_PER_SEC", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L12_RX_PER_SEC", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L12_TX_PER_SEC", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L13_RX_PER_SEC", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L13_TX_PER_SEC", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L14_RX_PER_SEC", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L14_TX_PER_SEC", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L15_RX_PER_SEC", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L15_TX_PER_SEC", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L16_RX_PER_SEC", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L16_TX_PER_SEC", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L17_RX_PER_SEC", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L17_TX_PER_SEC", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L1_RX_PER_SEC", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L1_TX_PER_SEC", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L2_RX_PER_SEC", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L2_TX_PER_SEC", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L3_RX_PER_SEC", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L3_TX_PER_SEC", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L4_RX_PER_SEC", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L4_TX_PER_SEC", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L5_RX_PER_SEC", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L5_TX_PER_SEC", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L6_RX_PER_SEC", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L6_TX_PER_SEC", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L7_RX_PER_SEC", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L7_TX_PER_SEC", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L8_RX_PER_SEC", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L8_TX_PER_SEC", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L9_RX_PER_SEC", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_L9_TX_PER_SEC", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_TOTAL_RX_PER_SEC", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVLINK_TOTAL_TX_PER_SEC", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVOFA_0_UTIL", "vllm.third_party.pynvml.NVML_GPM_METRIC_NVOFA_1_UTIL", "vllm.third_party.pynvml.NVML_GPM_METRIC_PCIE_RX_PER_SEC", "vllm.third_party.pynvml.NVML_GPM_METRIC_PCIE_TX_PER_SEC", "vllm.third_party.pynvml.NVML_GPM_METRIC_SM_OCCUPANCY", "vllm.third_party.pynvml.NVML_GPM_METRIC_SM_UTIL", "vllm.third_party.pynvml.NVML_GPM_SUPPORT_VERSION", "vllm.third_party.pynvml.NVML_GPU_ATTESTATION_CERT_CHAIN_SIZE", "vllm.third_party.pynvml.NVML_GPU_CERT_CHAIN_SIZE", "vllm.third_party.pynvml.NVML_GPU_FABRIC_HEALTH_MASK_ACCESS_TIMEOUT_RECOVERY_FALSE", "vllm.third_party.pynvml.NVML_GPU_FABRIC_HEALTH_MASK_ACCESS_TIMEOUT_RECOVERY_NOT_SUPPORTED", "vllm.third_party.pynvml.NVML_GPU_FABRIC_HEALTH_MASK_ACCESS_TIMEOUT_RECOVERY_TRUE", "vllm.third_party.pynvml.NVML_GPU_FABRIC_HEALTH_MASK_DEGRADED_BW_FALSE", "vllm.third_party.pynvml.NVML_GPU_FABRIC_HEALTH_MASK_DEGRADED_BW_NOT_SUPPORTED", "vllm.third_party.pynvml.NVML_GPU_FABRIC_HEALTH_MASK_DEGRADED_BW_TRUE", "vllm.third_party.pynvml.NVML_GPU_FABRIC_HEALTH_MASK_ROUTE_RECOVERY_FALSE", "vllm.third_party.pynvml.NVML_GPU_FABRIC_HEALTH_MASK_ROUTE_RECOVERY_NOT_SUPPORTED", "vllm.third_party.pynvml.NVML_GPU_FABRIC_HEALTH_MASK_ROUTE_RECOVERY_TRUE", "vllm.third_party.pynvml.NVML_GPU_FABRIC_HEALTH_MASK_ROUTE_UNHEALTHY_FALSE", "vllm.third_party.pynvml.NVML_GPU_FABRIC_HEALTH_MASK_ROUTE_UNHEALTHY_NOT_SUPPORTED", "vllm.third_party.pynvml.NVML_GPU_FABRIC_HEALTH_MASK_ROUTE_UNHEALTHY_TRUE", "vllm.third_party.pynvml.NVML_GPU_FABRIC_HEALTH_MASK_SHIFT_ACCESS_TIMEOUT_RECOVERY", "vllm.third_party.pynvml.NVML_GPU_FABRIC_HEALTH_MASK_SHIFT_DEGRADED_BW", "vllm.third_party.pynvml.NVML_GPU_FABRIC_HEALTH_MASK_SHIFT_ROUTE_RECOVERY", "vllm.third_party.pynvml.NVML_GPU_FABRIC_HEALTH_MASK_SHIFT_ROUTE_UNHEALTHY", "vllm.third_party.pynvml.NVML_GPU_FABRIC_HEALTH_MASK_WIDTH_ACCESS_TIMEOUT_RECOVERY", "vllm.third_party.pynvml.NVML_GPU_FABRIC_HEALTH_MASK_WIDTH_DEGRADED_BW", "vllm.third_party.pynvml.NVML_GPU_FABRIC_HEALTH_MASK_WIDTH_ROUTE_RECOVERY", "vllm.third_party.pynvml.NVML_GPU_FABRIC_HEALTH_MASK_WIDTH_ROUTE_UNHEALTHY", "vllm.third_party.pynvml.NVML_GPU_FABRIC_STATE_COMPLETED", "vllm.third_party.pynvml.NVML_GPU_FABRIC_STATE_IN_PROGRESS", "vllm.third_party.pynvml.NVML_GPU_FABRIC_STATE_NOT_STARTED", "vllm.third_party.pynvml.NVML_GPU_FABRIC_STATE_NOT_SUPPORTED", "vllm.third_party.pynvml.NVML_GPU_FABRIC_UUID_LEN", "vllm.third_party.pynvml.NVML_GPU_INSTANCE_PROFILE_1_SLICE", "vllm.third_party.pynvml.NVML_GPU_INSTANCE_PROFILE_1_SLICE_GFX", "vllm.third_party.pynvml.NVML_GPU_INSTANCE_PROFILE_1_SLICE_REV1", "vllm.third_party.pynvml.NVML_GPU_INSTANCE_PROFILE_1_SLICE_REV2", "vllm.third_party.pynvml.NVML_GPU_INSTANCE_PROFILE_2_SLICE", "vllm.third_party.pynvml.NVML_GPU_INSTANCE_PROFILE_2_SLICE_GFX", "vllm.third_party.pynvml.NVML_GPU_INSTANCE_PROFILE_2_SLICE_REV1", "vllm.third_party.pynvml.NVML_GPU_INSTANCE_PROFILE_3_SLICE", "vllm.third_party.pynvml.NVML_GPU_INSTANCE_PROFILE_4_SLICE", "vllm.third_party.pynvml.NVML_GPU_INSTANCE_PROFILE_4_SLICE_GFX", "vllm.third_party.pynvml.NVML_GPU_INSTANCE_PROFILE_6_SLICE", "vllm.third_party.pynvml.NVML_GPU_INSTANCE_PROFILE_7_SLICE", "vllm.third_party.pynvml.NVML_GPU_INSTANCE_PROFILE_8_SLICE", "vllm.third_party.pynvml.NVML_GPU_INSTANCE_PROFILE_COUNT", "vllm.third_party.pynvml.NVML_GPU_NVLINK_BW_MODE_3QUARTER", "vllm.third_party.pynvml.NVML_GPU_NVLINK_BW_MODE_COUNT", "vllm.third_party.pynvml.NVML_GPU_NVLINK_BW_MODE_FULL", "vllm.third_party.pynvml.NVML_GPU_NVLINK_BW_MODE_HALF", "vllm.third_party.pynvml.NVML_GPU_NVLINK_BW_MODE_MIN", "vllm.third_party.pynvml.NVML_GPU_NVLINK_BW_MODE_OFF", "vllm.third_party.pynvml.NVML_GPU_RECOVERY_ACTION_DRAIN_AND_RESET", "vllm.third_party.pynvml.NVML_GPU_RECOVERY_ACTION_DRAIN_P2P", "vllm.third_party.pynvml.NVML_GPU_RECOVERY_ACTION_GPU_RESET", "vllm.third_party.pynvml.NVML_GPU_RECOVERY_ACTION_NODE_REBOOT", "vllm.third_party.pynvml.NVML_GPU_RECOVERY_ACTION_NONE", "vllm.third_party.pynvml.NVML_GPU_UTILIZATION_DOMAIN_BUS", "vllm.third_party.pynvml.NVML_GPU_UTILIZATION_DOMAIN_FB", "vllm.third_party.pynvml.NVML_GPU_UTILIZATION_DOMAIN_GPU", "vllm.third_party.pynvml.NVML_GPU_UTILIZATION_DOMAIN_VID", "vllm.third_party.pynvml.NVML_GPU_UTILIZATION_SAMPLES", "vllm.third_party.pynvml.NVML_GPU_VIRTUALIZATION_MODE_HOST_VGPU", "vllm.third_party.pynvml.NVML_GPU_VIRTUALIZATION_MODE_HOST_VSGA", "vllm.third_party.pynvml.NVML_GPU_VIRTUALIZATION_MODE_NONE", "vllm.third_party.pynvml.NVML_GPU_VIRTUALIZATION_MODE_PASSTHROUGH", "vllm.third_party.pynvml.NVML_GPU_VIRTUALIZATION_MODE_VGPU", "vllm.third_party.pynvml.NVML_GRID_LICENSE_BUFFER_SIZE", "vllm.third_party.pynvml.NVML_GRID_LICENSE_EXPIRY_INVALID", "vllm.third_party.pynvml.NVML_GRID_LICENSE_EXPIRY_NOT_APPLICABLE", "vllm.third_party.pynvml.NVML_GRID_LICENSE_EXPIRY_NOT_AVAILABLE", "vllm.third_party.pynvml.NVML_GRID_LICENSE_EXPIRY_PERMANENT", "vllm.third_party.pynvml.NVML_GRID_LICENSE_EXPIRY_VALID", "vllm.third_party.pynvml.NVML_GRID_LICENSE_FEATURE_CODE_COMPUTE", "vllm.third_party.pynvml.NVML_GRID_LICENSE_FEATURE_CODE_GAMING", "vllm.third_party.pynvml.NVML_GRID_LICENSE_FEATURE_CODE_NVIDIA_RTX", "vllm.third_party.pynvml.NVML_GRID_LICENSE_FEATURE_CODE_UNKNOWN", "vllm.third_party.pynvml.NVML_GRID_LICENSE_FEATURE_CODE_VGPU", "vllm.third_party.pynvml.NVML_GRID_LICENSE_FEATURE_CODE_VWORKSTATION", "vllm.third_party.pynvml.NVML_GRID_LICENSE_FEATURE_MAX_COUNT", "vllm.third_party.pynvml.NVML_GRID_LICENSE_STATE_LICENSED", "vllm.third_party.pynvml.NVML_GRID_LICENSE_STATE_UNINITIALIZED", "vllm.third_party.pynvml.NVML_GRID_LICENSE_STATE_UNKNOWN", "vllm.third_party.pynvml.NVML_GRID_LICENSE_STATE_UNLICENSED", "vllm.third_party.pynvml.NVML_GRID_LICENSE_STATE_UNLICENSED_RESTRICTED", "vllm.third_party.pynvml.NVML_GRID_LICENSE_STATE_UNLICENSED_UNRESTRICTED", "vllm.third_party.pynvml.NVML_GSP_FIRMWARE_VERSION_BUF_SIZE", "vllm.third_party.pynvml.NVML_HOST_VGPU_MODE_NON_SRIOV", "vllm.third_party.pynvml.NVML_HOST_VGPU_MODE_SRIOV", "vllm.third_party.pynvml.NVML_INFOROM_COUNT", "vllm.third_party.pynvml.NVML_INFOROM_DEN", "vllm.third_party.pynvml.NVML_INFOROM_ECC", "vllm.third_party.pynvml.NVML_INFOROM_OEM", "vllm.third_party.pynvml.NVML_INFOROM_POWER", "vllm.third_party.pynvml.NVML_INIT_FLAG_NO_ATTACH", "vllm.third_party.pynvml.NVML_INIT_FLAG_NO_GPUS", "vllm.third_party.pynvml.NVML_JPG_UTILIZATION_SAMPLES", "vllm.third_party.pynvml.NVML_LED_COLOR_AMBER", "vllm.third_party.pynvml.NVML_LED_COLOR_GREEN", "vllm.third_party.pynvml.NVML_MAX_GPC_COUNT", "vllm.third_party.pynvml.NVML_MAX_GPU_PERF_PSTATES", "vllm.third_party.pynvml.NVML_MAX_GPU_UTILIZATIONS", "vllm.third_party.pynvml.NVML_MAX_PHYSICAL_BRIDGE", "vllm.third_party.pynvml.NVML_MAX_THERMAL_SENSORS_PER_GPU", "vllm.third_party.pynvml.NVML_MEMORY_CLK_SAMPLES", "vllm.third_party.pynvml.NVML_MEMORY_ERROR_TYPE_CORRECTED", "vllm.third_party.pynvml.NVML_MEMORY_ERROR_TYPE_COUNT", "vllm.third_party.pynvml.NVML_MEMORY_ERROR_TYPE_UNCORRECTED", "vllm.third_party.pynvml.NVML_MEMORY_LOCATION_CBU", "vllm.third_party.pynvml.NVML_MEMORY_LOCATION_COUNT", "vllm.third_party.pynvml.NVML_MEMORY_LOCATION_DEVICE_MEMORY", "vllm.third_party.pynvml.NVML_MEMORY_LOCATION_DRAM", "vllm.third_party.pynvml.NVML_MEMORY_LOCATION_L1_CACHE", "vllm.third_party.pynvml.NVML_MEMORY_LOCATION_L2_CACHE", "vllm.third_party.pynvml.NVML_MEMORY_LOCATION_REGISTER_FILE", "vllm.third_party.pynvml.NVML_MEMORY_LOCATION_SRAM", "vllm.third_party.pynvml.NVML_MEMORY_LOCATION_TEXTURE_MEMORY", "vllm.third_party.pynvml.NVML_MEMORY_LOCATION_TEXTURE_SHM", "vllm.third_party.pynvml.NVML_MEMORY_UTILIZATION_SAMPLES", "vllm.third_party.pynvml.NVML_MODULE_POWER_SAMPLES", "vllm.third_party.pynvml.NVML_NVLINK_CAP_COUNT", "vllm.third_party.pynvml.NVML_NVLINK_CAP_P2P_ATOMICS", "vllm.third_party.pynvml.NVML_NVLINK_CAP_P2P_SUPPORTED", "vllm.third_party.pynvml.NVML_NVLINK_CAP_SLI_BRIDGE", "vllm.third_party.pynvml.NVML_NVLINK_CAP_SYSMEM_ACCESS", "vllm.third_party.pynvml.NVML_NVLINK_CAP_SYSMEM_ATOMICS", "vllm.third_party.pynvml.NVML_NVLINK_CAP_VALID", "vllm.third_party.pynvml.NVML_NVLINK_COUNTER_PKTFILTER_ALL", "vllm.third_party.pynvml.NVML_NVLINK_COUNTER_PKTFILTER_FLUSH", "vllm.third_party.pynvml.NVML_NVLINK_COUNTER_PKTFILTER_NOP", "vllm.third_party.pynvml.NVML_NVLINK_COUNTER_PKTFILTER_NRATOM", "vllm.third_party.pynvml.NVML_NVLINK_COUNTER_PKTFILTER_RATOM", "vllm.third_party.pynvml.NVML_NVLINK_COUNTER_PKTFILTER_READ", "vllm.third_party.pynvml.NVML_NVLINK_COUNTER_PKTFILTER_RESPDATA", "vllm.third_party.pynvml.NVML_NVLINK_COUNTER_PKTFILTER_RESPNODATA", "vllm.third_party.pynvml.NVML_NVLINK_COUNTER_PKTFILTER_WRITE", "vllm.third_party.pynvml.NVML_NVLINK_COUNTER_UNIT_BYTES", "vllm.third_party.pynvml.NVML_NVLINK_COUNTER_UNIT_COUNT", "vllm.third_party.pynvml.NVML_NVLINK_COUNTER_UNIT_CYCLES", "vllm.third_party.pynvml.NVML_NVLINK_COUNTER_UNIT_PACKETS", "vllm.third_party.pynvml.NVML_NVLINK_COUNTER_UNIT_RESERVED", "vllm.third_party.pynvml.NVML_NVLINK_DEVICE_TYPE_GPU", "vllm.third_party.pynvml.NVML_NVLINK_DEVICE_TYPE_IBMNPU", "vllm.third_party.pynvml.NVML_NVLINK_DEVICE_TYPE_SWITCH", "vllm.third_party.pynvml.NVML_NVLINK_DEVICE_TYPE_UNKNOWN", "vllm.third_party.pynvml.NVML_NVLINK_ERROR_COUNT", "vllm.third_party.pynvml.NVML_NVLINK_ERROR_DL_CRC_DATA", "vllm.third_party.pynvml.NVML_NVLINK_ERROR_DL_CRC_FLIT", "vllm.third_party.pynvml.NVML_NVLINK_ERROR_DL_ECC_COUNT", "vllm.third_party.pynvml.NVML_NVLINK_ERROR_DL_ECC_DATA", "vllm.third_party.pynvml.NVML_NVLINK_ERROR_DL_ECC_LANE0", "vllm.third_party.pynvml.NVML_NVLINK_ERROR_DL_ECC_LANE1", "vllm.third_party.pynvml.NVML_NVLINK_ERROR_DL_ECC_LANE2", "vllm.third_party.pynvml.NVML_NVLINK_ERROR_DL_ECC_LANE3", "vllm.third_party.pynvml.NVML_NVLINK_ERROR_DL_RECOVERY", "vllm.third_party.pynvml.NVML_NVLINK_ERROR_DL_REPLAY", "vllm.third_party.pynvml.NVML_NVLINK_LOW_POWER_THRESHOLD_MAX", "vllm.third_party.pynvml.NVML_NVLINK_LOW_POWER_THRESHOLD_MIN", "vllm.third_party.pynvml.NVML_NVLINK_LOW_POWER_THRESHOLD_RESET", "vllm.third_party.pynvml.NVML_NVLINK_LOW_POWER_THRESHOLD_UNIT_100US", "vllm.third_party.pynvml.NVML_NVLINK_LOW_POWER_THRESHOLD_UNIT_50US", "vllm.third_party.pynvml.NVML_NVLINK_MAX_LINKS", "vllm.third_party.pynvml.NVML_NVLINK_POWER_STATE_HIGH_SPEED", "vllm.third_party.pynvml.NVML_NVLINK_POWER_STATE_LOW", "vllm.third_party.pynvml.NVML_NVLINK_STATE_ACTIVE", "vllm.third_party.pynvml.NVML_NVLINK_STATE_INACTIVE", "vllm.third_party.pynvml.NVML_NVLINK_STATE_SLEEP", "vllm.third_party.pynvml.NVML_NVLINK_TOTAL_SUPPORTED_BW_MODES", "vllm.third_party.pynvml.NVML_NVLINK_VERSION_1_0", "vllm.third_party.pynvml.NVML_NVLINK_VERSION_2_0", "vllm.third_party.pynvml.NVML_NVLINK_VERSION_2_2", "vllm.third_party.pynvml.NVML_NVLINK_VERSION_3_0", "vllm.third_party.pynvml.NVML_NVLINK_VERSION_3_1", "vllm.third_party.pynvml.NVML_NVLINK_VERSION_4_0", "vllm.third_party.pynvml.NVML_NVLINK_VERSION_5_0", "vllm.third_party.pynvml.NVML_NVLINK_VERSION_INVALID", "vllm.third_party.pynvml.NVML_OFA_UTILIZATION_SAMPLES", "vllm.third_party.pynvml.NVML_P2P_CAPS_INDEX_ATOMICS", "vllm.third_party.pynvml.NVML_P2P_CAPS_INDEX_NVLINK", "vllm.third_party.pynvml.NVML_P2P_CAPS_INDEX_PCI", "vllm.third_party.pynvml.NVML_P2P_CAPS_INDEX_PROP", "vllm.third_party.pynvml.NVML_P2P_CAPS_INDEX_READ", "vllm.third_party.pynvml.NVML_P2P_CAPS_INDEX_UNKNOWN", "vllm.third_party.pynvml.NVML_P2P_CAPS_INDEX_WRITE", "vllm.third_party.pynvml.NVML_P2P_STATUS_CHIPSET_NOT_SUPPORED", "vllm.third_party.pynvml.NVML_P2P_STATUS_DISABLED_BY_REGKEY", "vllm.third_party.pynvml.NVML_P2P_STATUS_GPU_NOT_SUPPORTED", "vllm.third_party.pynvml.NVML_P2P_STATUS_IOH_TOPOLOGY_NOT_SUPPORTED", "vllm.third_party.pynvml.NVML_P2P_STATUS_NOT_SUPPORTED", "vllm.third_party.pynvml.NVML_P2P_STATUS_OK", "vllm.third_party.pynvml.NVML_P2P_STATUS_UNKNOWN", "vllm.third_party.pynvml.NVML_PAGE_RETIREMENT_CAUSE_COUNT", "vllm.third_party.pynvml.NVML_PAGE_RETIREMENT_CAUSE_DOUBLE_BIT_ECC_ERROR", "vllm.third_party.pynvml.NVML_PAGE_RETIREMENT_CAUSE_MULTIPLE_SINGLE_BIT_ECC_ERRORS", "vllm.third_party.pynvml.NVML_PCIE_ATOMICS_CAP_CAS128", "vllm.third_party.pynvml.NVML_PCIE_ATOMICS_CAP_CAS32", "vllm.third_party.pynvml.NVML_PCIE_ATOMICS_CAP_CAS64", "vllm.third_party.pynvml.NVML_PCIE_ATOMICS_CAP_FETCHADD32", "vllm.third_party.pynvml.NVML_PCIE_ATOMICS_CAP_FETCHADD64", "vllm.third_party.pynvml.NVML_PCIE_ATOMICS_CAP_SWAP32", "vllm.third_party.pynvml.NVML_PCIE_ATOMICS_CAP_SWAP64", "vllm.third_party.pynvml.NVML_PCIE_ATOMICS_OPS_MAX", "vllm.third_party.pynvml.NVML_PCIE_LINK_KEEP", "vllm.third_party.pynvml.NVML_PCIE_LINK_MAX_SPEED_16000MBPS", "vllm.third_party.pynvml.NVML_PCIE_LINK_MAX_SPEED_2500MBPS", "vllm.third_party.pynvml.NVML_PCIE_LINK_MAX_SPEED_32000MBPS", "vllm.third_party.pynvml.NVML_PCIE_LINK_MAX_SPEED_5000MBPS", "vllm.third_party.pynvml.NVML_PCIE_LINK_MAX_SPEED_64000MBPS", "vllm.third_party.pynvml.NVML_PCIE_LINK_MAX_SPEED_8000MBPS", "vllm.third_party.pynvml.NVML_PCIE_LINK_MAX_SPEED_INVALID", "vllm.third_party.pynvml.NVML_PCIE_LINK_SHUT_DOWN", "vllm.third_party.pynvml.NVML_PCIE_UTIL_COUNT", "vllm.third_party.pynvml.NVML_PCIE_UTIL_RX_BYTES", "vllm.third_party.pynvml.NVML_PCIE_UTIL_TX_BYTES", "vllm.third_party.pynvml.NVML_PERF_MODES_BUFFER_SIZE", "vllm.third_party.pynvml.NVML_PERF_POLICY_BOARD_LIMIT", "vllm.third_party.pynvml.NVML_PERF_POLICY_COUNT", "vllm.third_party.pynvml.NVML_PERF_POLICY_LOW_UTILIZATION", "vllm.third_party.pynvml.NVML_PERF_POLICY_POWER", "vllm.third_party.pynvml.NVML_PERF_POLICY_RELIABILITY", "vllm.third_party.pynvml.NVML_PERF_POLICY_SYNC_BOOST", "vllm.third_party.pynvml.NVML_PERF_POLICY_THERMAL", "vllm.third_party.pynvml.NVML_PERF_POLICY_TOTAL_APP_CLOCKS", "vllm.third_party.pynvml.NVML_PERF_POLICY_TOTAL_BASE_CLOCKS", "vllm.third_party.pynvml.NVML_POWER_PROFILE_BALANCED", "vllm.third_party.pynvml.NVML_POWER_PROFILE_COMPUTE", "vllm.third_party.pynvml.NVML_POWER_PROFILE_DCPCIE", "vllm.third_party.pynvml.NVML_POWER_PROFILE_HMMA_DENSE", "vllm.third_party.pynvml.NVML_POWER_PROFILE_HMMA_SPARSE", "vllm.third_party.pynvml.NVML_POWER_PROFILE_HPC", "vllm.third_party.pynvml.NVML_POWER_PROFILE_LLM_INFERENCE", "vllm.third_party.pynvml.NVML_POWER_PROFILE_LLM_TRAINING", "vllm.third_party.pynvml.NVML_POWER_PROFILE_MAX", "vllm.third_party.pynvml.NVML_POWER_PROFILE_MAX_P", "vllm.third_party.pynvml.NVML_POWER_PROFILE_MAX_Q", "vllm.third_party.pynvml.NVML_POWER_PROFILE_MEMORY_BOUND", "vllm.third_party.pynvml.NVML_POWER_PROFILE_MIG", "vllm.third_party.pynvml.NVML_POWER_PROFILE_NETWORK", "vllm.third_party.pynvml.NVML_POWER_PROFILE_RBM", "vllm.third_party.pynvml.NVML_POWER_PROFILE_SYNC_BALANCED", "vllm.third_party.pynvml.NVML_POWER_SCOPE_GPU", "vllm.third_party.pynvml.NVML_POWER_SCOPE_MEMORY", "vllm.third_party.pynvml.NVML_POWER_SCOPE_MODULE", "vllm.third_party.pynvml.NVML_POWER_SMOOTHING_ADMIN_OVERRIDE_NOT_SET", "vllm.third_party.pynvml.NVML_POWER_SMOOTHING_MAX_NUM_PROFILES", "vllm.third_party.pynvml.NVML_POWER_SMOOTHING_PROFILE_PARAM_PERCENT_TMP_FLOOR", "vllm.third_party.pynvml.NVML_POWER_SMOOTHING_PROFILE_PARAM_RAMP_DOWN_HYSTERESIS", "vllm.third_party.pynvml.NVML_POWER_SMOOTHING_PROFILE_PARAM_RAMP_DOWN_RATE", "vllm.third_party.pynvml.NVML_POWER_SMOOTHING_PROFILE_PARAM_RAMP_UP_RATE", "vllm.third_party.pynvml.NVML_POWER_SOURCE_AC", "vllm.third_party.pynvml.NVML_POWER_SOURCE_BATTERY", "vllm.third_party.pynvml.NVML_POWER_SOURCE_UNDERSIZED", "vllm.third_party.pynvml.NVML_PROCESSOR_CLK_SAMPLES", "vllm.third_party.pynvml.NVML_PROCESS_MODE_COMPUTE", "vllm.third_party.pynvml.NVML_PROCESS_MODE_GRAPHICS", "vllm.third_party.pynvml.NVML_PROCESS_MODE_MPS", "vllm.third_party.pynvml.NVML_PSTATE_0", "vllm.third_party.pynvml.NVML_PSTATE_1", "vllm.third_party.pynvml.NVML_PSTATE_10", "vllm.third_party.pynvml.NVML_PSTATE_11", "vllm.third_party.pynvml.NVML_PSTATE_12", "vllm.third_party.pynvml.NVML_PSTATE_13", "vllm.third_party.pynvml.NVML_PSTATE_14", "vllm.third_party.pynvml.NVML_PSTATE_15", "vllm.third_party.pynvml.NVML_PSTATE_2", "vllm.third_party.pynvml.NVML_PSTATE_3", "vllm.third_party.pynvml.NVML_PSTATE_4", "vllm.third_party.pynvml.NVML_PSTATE_5", "vllm.third_party.pynvml.NVML_PSTATE_6", "vllm.third_party.pynvml.NVML_PSTATE_7", "vllm.third_party.pynvml.NVML_PSTATE_8", "vllm.third_party.pynvml.NVML_PSTATE_9", "vllm.third_party.pynvml.NVML_PSTATE_UNKNOWN", "vllm.third_party.pynvml.NVML_RESTRICTED_API_COUNT", "vllm.third_party.pynvml.NVML_RESTRICTED_API_SET_APPLICATION_CLOCKS", "vllm.third_party.pynvml.NVML_RESTRICTED_API_SET_AUTO_BOOSTED_CLOCKS", "vllm.third_party.pynvml.NVML_SAMPLINGTYPE_COUNT", "vllm.third_party.pynvml.NVML_SCHEDULER_SW_MAX_LOG_ENTRIES", "vllm.third_party.pynvml.NVML_SINGLE_BIT_ECC", "vllm.third_party.pynvml.NVML_SUCCESS", "vllm.third_party.pynvml.NVML_SUPPORTED_VGPU_SCHEDULER_POLICY_COUNT", "vllm.third_party.pynvml.NVML_SYSTEM_DRIVER_VERSION_BUFFER_SIZE", "vllm.third_party.pynvml.NVML_SYSTEM_NVML_VERSION_BUFFER_SIZE", "vllm.third_party.pynvml.NVML_TEMPERATURE_COUNT", "vllm.third_party.pynvml.NVML_TEMPERATURE_GPU", "vllm.third_party.pynvml.NVML_TEMPERATURE_THRESHOLD_ACOUSTIC_CURR", "vllm.third_party.pynvml.NVML_TEMPERATURE_THRESHOLD_ACOUSTIC_MAX", "vllm.third_party.pynvml.NVML_TEMPERATURE_THRESHOLD_ACOUSTIC_MIN", "vllm.third_party.pynvml.NVML_TEMPERATURE_THRESHOLD_COUNT", "vllm.third_party.pynvml.NVML_TEMPERATURE_THRESHOLD_GPS_CURR", "vllm.third_party.pynvml.NVML_TEMPERATURE_THRESHOLD_GPU_MAX", "vllm.third_party.pynvml.NVML_TEMPERATURE_THRESHOLD_MEM_MAX", "vllm.third_party.pynvml.NVML_TEMPERATURE_THRESHOLD_SHUTDOWN", "vllm.third_party.pynvml.NVML_TEMPERATURE_THRESHOLD_SLOWDOWN", "vllm.third_party.pynvml.NVML_THERMAL_CONTROLLER_ADM1032", "vllm.third_party.pynvml.NVML_THERMAL_CONTROLLER_ADT7461", "vllm.third_party.pynvml.NVML_THERMAL_CONTROLLER_ADT7473", "vllm.third_party.pynvml.NVML_THERMAL_CONTROLLER_ADT7473S", "vllm.third_party.pynvml.NVML_THERMAL_CONTROLLER_G781", "vllm.third_party.pynvml.NVML_THERMAL_CONTROLLER_GPU_INTERNAL", "vllm.third_party.pynvml.NVML_THERMAL_CONTROLLER_LM64", "vllm.third_party.pynvml.NVML_THERMAL_CONTROLLER_LM89", "vllm.third_party.pynvml.NVML_THERMAL_CONTROLLER_LM99", "vllm.third_party.pynvml.NVML_THERMAL_CONTROLLER_MAX1617", "vllm.third_party.pynvml.NVML_THERMAL_CONTROLLER_MAX6649", "vllm.third_party.pynvml.NVML_THERMAL_CONTROLLER_MAX6649R", "vllm.third_party.pynvml.NVML_THERMAL_CONTROLLER_NONE", "vllm.third_party.pynvml.NVML_THERMAL_CONTROLLER_NVSYSCON_CANOAS", "vllm.third_party.pynvml.NVML_THERMAL_CONTROLLER_NVSYSCON_E551", "vllm.third_party.pynvml.NVML_THERMAL_CONTROLLER_OS", "vllm.third_party.pynvml.NVML_THERMAL_CONTROLLER_SBMAX6649", "vllm.third_party.pynvml.NVML_THERMAL_CONTROLLER_UNKNOWN", "vllm.third_party.pynvml.NVML_THERMAL_CONTROLLER_VBIOSEVT", "vllm.third_party.pynvml.NVML_THERMAL_COOLER_SIGNAL_COUNT", "vllm.third_party.pynvml.NVML_THERMAL_COOLER_SIGNAL_NONE", "vllm.third_party.pynvml.NVML_THERMAL_COOLER_SIGNAL_TOGGLE", "vllm.third_party.pynvml.NVML_THERMAL_COOLER_SIGNAL_VARIABLE", "vllm.third_party.pynvml.NVML_THERMAL_COOLER_TARGET_GPU", "vllm.third_party.pynvml.NVML_THERMAL_COOLER_TARGET_GPU_RELATED", "vllm.third_party.pynvml.NVML_THERMAL_COOLER_TARGET_MEMORY", "vllm.third_party.pynvml.NVML_THERMAL_COOLER_TARGET_NONE", "vllm.third_party.pynvml.NVML_THERMAL_COOLER_TARGET_POWER_SUPPLY", "vllm.third_party.pynvml.NVML_THERMAL_TARGET_ALL", "vllm.third_party.pynvml.NVML_THERMAL_TARGET_BOARD", "vllm.third_party.pynvml.NVML_THERMAL_TARGET_GPU", "vllm.third_party.pynvml.NVML_THERMAL_TARGET_MEMORY", "vllm.third_party.pynvml.NVML_THERMAL_TARGET_NONE", "vllm.third_party.pynvml.NVML_THERMAL_TARGET_POWER_SUPPLY", "vllm.third_party.pynvml.NVML_THERMAL_TARGET_UNKNOWN", "vllm.third_party.pynvml.NVML_THERMAL_TARGET_VCD_BOARD", "vllm.third_party.pynvml.NVML_THERMAL_TARGET_VCD_INLET", "vllm.third_party.pynvml.NVML_THERMAL_TARGET_VCD_OUTLET", "vllm.third_party.pynvml.NVML_TOPOLOGY_HOSTBRIDGE", "vllm.third_party.pynvml.NVML_TOPOLOGY_INTERNAL", "vllm.third_party.pynvml.NVML_TOPOLOGY_MULTIPLE", "vllm.third_party.pynvml.NVML_TOPOLOGY_NODE", "vllm.third_party.pynvml.NVML_TOPOLOGY_SINGLE", "vllm.third_party.pynvml.NVML_TOPOLOGY_SYSTEM", "vllm.third_party.pynvml.NVML_TOTAL_POWER_SAMPLES", "vllm.third_party.pynvml.NVML_VALUE_NOT_AVAILABLE_uint", "vllm.third_party.pynvml.NVML_VALUE_NOT_AVAILABLE_ulonglong", "vllm.third_party.pynvml.NVML_VALUE_TYPE_COUNT", "vllm.third_party.pynvml.NVML_VALUE_TYPE_DOUBLE", "vllm.third_party.pynvml.NVML_VALUE_TYPE_SIGNED_INT", "vllm.third_party.pynvml.NVML_VALUE_TYPE_SIGNED_LONG_LONG", "vllm.third_party.pynvml.NVML_VALUE_TYPE_UNSIGNED_INT", "vllm.third_party.pynvml.NVML_VALUE_TYPE_UNSIGNED_LONG", "vllm.third_party.pynvml.NVML_VALUE_TYPE_UNSIGNED_LONG_LONG", "vllm.third_party.pynvml.NVML_VALUE_TYPE_UNSIGNED_SHORT", "vllm.third_party.pynvml.NVML_VGPU_CAP_COUNT", "vllm.third_party.pynvml.NVML_VGPU_CAP_EXCLUSIVE_SIZE", "vllm.third_party.pynvml.NVML_VGPU_CAP_EXCLUSIVE_TYPE", "vllm.third_party.pynvml.NVML_VGPU_CAP_GPUDIRECT", "vllm.third_party.pynvml.NVML_VGPU_CAP_MULTI_VGPU_EXCLUSIVE", "vllm.third_party.pynvml.NVML_VGPU_CAP_NVLINK_P2P", "vllm.third_party.pynvml.NVML_VGPU_COMPATIBILITY_LIMIT_GPU", "vllm.third_party.pynvml.NVML_VGPU_COMPATIBILITY_LIMIT_GUEST_DRIVER", "vllm.third_party.pynvml.NVML_VGPU_COMPATIBILITY_LIMIT_HOST_DRIVER", "vllm.third_party.pynvml.NVML_VGPU_COMPATIBILITY_LIMIT_NONE", "vllm.third_party.pynvml.NVML_VGPU_COMPATIBILITY_LIMIT_OTHER", "vllm.third_party.pynvml.NVML_VGPU_DRIVER_CAP_COUNT", "vllm.third_party.pynvml.NVML_VGPU_DRIVER_CAP_HETEROGENEOUS_MULTI_VGPU", "vllm.third_party.pynvml.NVML_VGPU_DRIVER_CAP_WARM_UPDATE", "vllm.third_party.pynvml.NVML_VGPU_INSTANCE_GUEST_INFO_STATE_INITIALIZED", "vllm.third_party.pynvml.NVML_VGPU_INSTANCE_GUEST_INFO_STATE_UNINITIALIZED", "vllm.third_party.pynvml.NVML_VGPU_METADATA_OPAQUE_DATA_SIZE", "vllm.third_party.pynvml.NVML_VGPU_NAME_BUFFER_SIZE", "vllm.third_party.pynvml.NVML_VGPU_PGPU_HETEROGENEOUS_MODE", "vllm.third_party.pynvml.NVML_VGPU_PGPU_HOMOGENEOUS_MODE", "vllm.third_party.pynvml.NVML_VGPU_PGPU_METADATA_OPAQUE_DATA_SIZE", "vllm.third_party.pynvml.NVML_VGPU_SCHEDULER_ARR_DEFAULT", "vllm.third_party.pynvml.NVML_VGPU_SCHEDULER_ARR_DISABLE", "vllm.third_party.pynvml.NVML_VGPU_SCHEDULER_ARR_ENABLE", "vllm.third_party.pynvml.NVML_VGPU_SCHEDULER_POLICY_BEST_EFFORT", "vllm.third_party.pynvml.NVML_VGPU_SCHEDULER_POLICY_EQUAL_SHARE", "vllm.third_party.pynvml.NVML_VGPU_SCHEDULER_POLICY_FIXED_SHARE", "vllm.third_party.pynvml.NVML_VGPU_SCHEDULER_POLICY_UNKNOWN", "vllm.third_party.pynvml.NVML_VGPU_VM_COMPATIBILITY_COLD", "vllm.third_party.pynvml.NVML_VGPU_VM_COMPATIBILITY_HIBERNATE", "vllm.third_party.pynvml.NVML_VGPU_VM_COMPATIBILITY_LIVE", "vllm.third_party.pynvml.NVML_VGPU_VM_COMPATIBILITY_NONE", "vllm.third_party.pynvml.NVML_VGPU_VM_COMPATIBILITY_SLEEP", "vllm.third_party.pynvml.NVML_VGPU_VM_ID_DOMAIN_ID", "vllm.third_party.pynvml.NVML_VGPU_VM_ID_UUID", "vllm.third_party.pynvml.NVML_VOLATILE_ECC", "vllm.third_party.pynvml.NVML_WORKLOAD_POWER_MAX_PROFILES", "vllm.third_party.pynvml.ProcessesUtilizationInfo_v1", "vllm.third_party.pynvml.SystemDriverBranchInfo_v1", "vllm.third_party.pynvml.VgpuHeterogeneousMode_v1", "vllm.third_party.pynvml.VgpuInstancesUtilizationInfo_v1", "vllm.third_party.pynvml.VgpuPlacementId_v1", "vllm.third_party.pynvml.VgpuPlacementList_v1", "vllm.third_party.pynvml.VgpuPlacementList_v2", "vllm.third_party.pynvml.VgpuProcessesUtilizationInfo_v1", "vllm.third_party.pynvml.VgpuRuntimeState_v1", "vllm.third_party.pynvml.VgpuTypeBar1Info_v1", "vllm.third_party.pynvml.c_metricInfo_t", "vllm.third_party.pynvml.c_nvmlAccountingStats_t", "vllm.third_party.pynvml.c_nvmlBAR1Memory_t", "vllm.third_party.pynvml.c_nvmlBridgeChipHierarchy_t", "vllm.third_party.pynvml.c_nvmlBridgeChipInfo_t", "vllm.third_party.pynvml.c_nvmlC2cModeInfo_v1_t", "vllm.third_party.pynvml.c_nvmlClockOffset_t", "vllm.third_party.pynvml.c_nvmlComputeInstanceInfo_t", "vllm.third_party.pynvml.c_nvmlComputeInstancePlacement_t", "vllm.third_party.pynvml.c_nvmlComputeInstanceProfileInfo_t", "vllm.third_party.pynvml.c_nvmlComputeInstanceProfileInfo_v2_t", "vllm.third_party.pynvml.c_nvmlComputeInstance_t", "vllm.third_party.pynvml.c_nvmlConfComputeGetKeyRotationThresholdInfo_t", "vllm.third_party.pynvml.c_nvmlConfComputeGpuAttestationReport_t", "vllm.third_party.pynvml.c_nvmlConfComputeGpuCertificate_t", "vllm.third_party.pynvml.c_nvmlConfComputeMemSizeInfo_t", "vllm.third_party.pynvml.c_nvmlConfComputeSetKeyRotationThresholdInfo_t", "vllm.third_party.pynvml.c_nvmlConfComputeSystemCaps_t", "vllm.third_party.pynvml.c_nvmlConfComputeSystemState_t", "vllm.third_party.pynvml.c_nvmlCoolerInfo_t", "vllm.third_party.pynvml.c_nvmlDeviceAttributes", "vllm.third_party.pynvml.c_nvmlDeviceCapabilities_v1_t", "vllm.third_party.pynvml.c_nvmlDeviceCurrentClockFreqs_v1_t", "vllm.third_party.pynvml.c_nvmlDevicePerfModes_v1_t", "vllm.third_party.pynvml.c_nvmlDevice_t", "vllm.third_party.pynvml.c_nvmlDramEncryptionInfo_t", "vllm.third_party.pynvml.c_nvmlEccErrorCounts_t", "vllm.third_party.pynvml.c_nvmlEccSramErrorStatus_v1_t", "vllm.third_party.pynvml.c_nvmlEncoderSession_t", "vllm.third_party.pynvml.c_nvmlEventData_t", "vllm.third_party.pynvml.c_nvmlEventSet_t", "vllm.third_party.pynvml.c_nvmlExcludedDeviceInfo_t", "vllm.third_party.pynvml.c_nvmlFBCSession_t", "vllm.third_party.pynvml.c_nvmlFBCStats_t", "vllm.third_party.pynvml.c_nvmlFanSpeedInfo_t", "vllm.third_party.pynvml.c_nvmlFieldValue_t", "vllm.third_party.pynvml.c_nvmlGpmMetric_t", "vllm.third_party.pynvml.c_nvmlGpmMetricsGet_t", "vllm.third_party.pynvml.c_nvmlGpmSample_t", "vllm.third_party.pynvml.c_nvmlGpmSupport_t", "vllm.third_party.pynvml.c_nvmlGpuDynamicPstatesInfo_t", "vllm.third_party.pynvml.c_nvmlGpuDynamicPstatesUtilization_t", "vllm.third_party.pynvml.c_nvmlGpuFabricInfoV_t", "vllm.third_party.pynvml.c_nvmlGpuFabricInfo_t", "vllm.third_party.pynvml.c_nvmlGpuInstanceInfo_t", "vllm.third_party.pynvml.c_nvmlGpuInstancePlacement_t", "vllm.third_party.pynvml.c_nvmlGpuInstanceProfileInfo_t", "vllm.third_party.pynvml.c_nvmlGpuInstanceProfileInfo_v2_t", "vllm.third_party.pynvml.c_nvmlGpuInstance_t", "vllm.third_party.pynvml.c_nvmlGpuThermalSensor_t", "vllm.third_party.pynvml.c_nvmlGpuThermalSettings_t", "vllm.third_party.pynvml.c_nvmlGridLicensableFeature_t", "vllm.third_party.pynvml.c_nvmlGridLicensableFeature_v2_t", "vllm.third_party.pynvml.c_nvmlGridLicensableFeature_v3_t", "vllm.third_party.pynvml.c_nvmlGridLicensableFeature_v4_t", "vllm.third_party.pynvml.c_nvmlGridLicensableFeatures_t", "vllm.third_party.pynvml.c_nvmlGridLicensableFeatures_v2_t", "vllm.third_party.pynvml.c_nvmlGridLicensableFeatures_v3_t", "vllm.third_party.pynvml.c_nvmlGridLicensableFeatures_v4_t", "vllm.third_party.pynvml.c_nvmlGridLicenseExpiry_t", "vllm.third_party.pynvml.c_nvmlHwbcEntry_t", "vllm.third_party.pynvml.c_nvmlLedState_t", "vllm.third_party.pynvml.c_nvmlMarginTemperature_v1_t", "vllm.third_party.pynvml.c_nvmlMask255_t", "vllm.third_party.pynvml.c_nvmlMemory_t", "vllm.third_party.pynvml.c_nvmlMemory_v2_t", "vllm.third_party.pynvml.c_nvmlNvLinkPowerThres_t", "vllm.third_party.pynvml.c_nvmlNvlinkGetBwMode_v1_t", "vllm.third_party.pynvml.c_nvmlNvlinkSetBwMode_v1_t", "vllm.third_party.pynvml.c_nvmlNvlinkSupportedBwModes_v1_t", "vllm.third_party.pynvml.c_nvmlPSUInfo_t", "vllm.third_party.pynvml.c_nvmlPlatformInfo_v1_t", "vllm.third_party.pynvml.c_nvmlPowerSmoothingProfile_v1_t", "vllm.third_party.pynvml.c_nvmlPowerSmoothingState_v1_t", "vllm.third_party.pynvml.c_nvmlPowerValue_v2_t", "vllm.third_party.pynvml.c_nvmlProcessDetailList_v1_t", "vllm.third_party.pynvml.c_nvmlProcessDetail_v1_t", "vllm.third_party.pynvml.c_nvmlProcessInfo_v2_t", "vllm.third_party.pynvml.c_nvmlProcessUtilizationInfo_v1_t", "vllm.third_party.pynvml.c_nvmlProcessUtilizationSample_t", "vllm.third_party.pynvml.c_nvmlProcessesUtilizationInfo_v1_t", "vllm.third_party.pynvml.c_nvmlRowRemapperHistogramValues", "vllm.third_party.pynvml.c_nvmlSample_t", "vllm.third_party.pynvml.c_nvmlSystemConfComputeSettings_v1_t", "vllm.third_party.pynvml.c_nvmlSystemDriverBranchInfo_v1_t", "vllm.third_party.pynvml.c_nvmlTemperature_v1_t", "vllm.third_party.pynvml.c_nvmlUnitFanInfo_t", "vllm.third_party.pynvml.c_nvmlUnitFanSpeeds_t", "vllm.third_party.pynvml.c_nvmlUnitInfo_t", "vllm.third_party.pynvml.c_nvmlUnit_t", "vllm.third_party.pynvml.c_nvmlUtilization_t", "vllm.third_party.pynvml.c_nvmlValue_t", "vllm.third_party.pynvml.c_nvmlVgpuHeterogeneousMode_v1_t", "vllm.third_party.pynvml.c_nvmlVgpuInstanceUtilizationInfo_v1_t", "vllm.third_party.pynvml.c_nvmlVgpuInstanceUtilizationSample_t", "vllm.third_party.pynvml.c_nvmlVgpuInstancesUtilizationInfo_v1_t", "vllm.third_party.pynvml.c_nvmlVgpuLicenseExpiry_t", "vllm.third_party.pynvml.c_nvmlVgpuLicenseInfo_t", "vllm.third_party.pynvml.c_nvmlVgpuMetadata_t", "vllm.third_party.pynvml.c_nvmlVgpuPgpuCompatibility_t", "vllm.third_party.pynvml.c_nvmlVgpuPgpuMetadata_t", "vllm.third_party.pynvml.c_nvmlVgpuPlacementId_v1_t", "vllm.third_party.pynvml.c_nvmlVgpuPlacementList_v1_t", "vllm.third_party.pynvml.c_nvmlVgpuPlacementList_v2_t", "vllm.third_party.pynvml.c_nvmlVgpuProcessUtilizationInfo_v1_t", "vllm.third_party.pynvml.c_nvmlVgpuProcessUtilizationSample_t", "vllm.third_party.pynvml.c_nvmlVgpuProcessesUtilizationInfo_v1_t", "vllm.third_party.pynvml.c_nvmlVgpuSchedDataWithARR_t", "vllm.third_party.pynvml.c_nvmlVgpuSchedData_t", "vllm.third_party.pynvml.c_nvmlVgpuSchedSetDataWithARR_t", "vllm.third_party.pynvml.c_nvmlVgpuSchedSetData_t", "vllm.third_party.pynvml.c_nvmlVgpuSchedulerCapabilities_t", "vllm.third_party.pynvml.c_nvmlVgpuSchedulerGetState_t", "vllm.third_party.pynvml.c_nvmlVgpuSchedulerLogEntry_t", "vllm.third_party.pynvml.c_nvmlVgpuSchedulerLog_t", "vllm.third_party.pynvml.c_nvmlVgpuSchedulerParams_t", "vllm.third_party.pynvml.c_nvmlVgpuSchedulerSetParams_t", "vllm.third_party.pynvml.c_nvmlVgpuSchedulerSetState_t", "vllm.third_party.pynvml.c_nvmlVgpuTypeBar1Info_v1_t", "vllm.third_party.pynvml.c_nvmlVgpuVersion_t", "vllm.third_party.pynvml.c_nvmlViolationTime_t", "vllm.third_party.pynvml.c_nvmlWorkloadPowerProfileCurrentProfiles_v1_t", "vllm.third_party.pynvml.c_nvmlWorkloadPowerProfileInfo_v1_t", "vllm.third_party.pynvml.c_nvmlWorkloadPowerProfileProfilesInfo_v1_t", "vllm.third_party.pynvml.c_nvmlWorkloadPowerProfileRequestedProfiles_v1_t", "vllm.third_party.pynvml.convertStrBytes", "vllm.third_party.pynvml.libLoadLock", "vllm.third_party.pynvml.nvmlC2cModeInfo_v1", "vllm.third_party.pynvml.nvmlClkMonFaultInfo_t", "vllm.third_party.pynvml.nvmlClkMonStatus_t", "vllm.third_party.pynvml.nvmlClockOffset_v1", "vllm.third_party.pynvml.nvmlClocksEventReasonAll", "vllm.third_party.pynvml.nvmlClocksEventReasonApplicationsClocksSetting", "vllm.third_party.pynvml.nvmlClocksEventReasonDisplayClockSetting", "vllm.third_party.pynvml.nvmlClocksEventReasonGpuIdle", "vllm.third_party.pynvml.nvmlClocksEventReasonHwPowerBrakeSlowdown", "vllm.third_party.pynvml.nvmlClocksEventReasonHwSlowdown", "vllm.third_party.pynvml.nvmlClocksEventReasonHwThermalSlowdown", "vllm.third_party.pynvml.nvmlClocksEventReasonNone", "vllm.third_party.pynvml.nvmlClocksEventReasonSwPowerCap", "vllm.third_party.pynvml.nvmlClocksEventReasonSwThermalSlowdown", "vllm.third_party.pynvml.nvmlClocksEventReasonSyncBoost", "vllm.third_party.pynvml.nvmlClocksThrottleReasonAll", "vllm.third_party.pynvml.nvmlClocksThrottleReasonApplicationsClocksSetting", "vllm.third_party.pynvml.nvmlClocksThrottleReasonDisplayClockSetting", "vllm.third_party.pynvml.nvmlClocksThrottleReasonGpuIdle", "vllm.third_party.pynvml.nvmlClocksThrottleReasonHwPowerBrakeSlowdown", "vllm.third_party.pynvml.nvmlClocksThrottleReasonHwSlowdown", "vllm.third_party.pynvml.nvmlClocksThrottleReasonHwThermalSlowdown", "vllm.third_party.pynvml.nvmlClocksThrottleReasonNone", "vllm.third_party.pynvml.nvmlClocksThrottleReasonSwPowerCap", "vllm.third_party.pynvml.nvmlClocksThrottleReasonSwThermalSlowdown", "vllm.third_party.pynvml.nvmlClocksThrottleReasonSyncBoost", "vllm.third_party.pynvml.nvmlComputeInstanceDestroy", "vllm.third_party.pynvml.nvmlComputeInstanceGetInfo", "vllm.third_party.pynvml.nvmlComputeInstanceGetInfo_v2", "vllm.third_party.pynvml.nvmlComputeInstanceProfileInfo_v2", "vllm.third_party.pynvml.nvmlCoolerInfo_v1", "vllm.third_party.pynvml.nvmlDeviceCapabilities_v1", "vllm.third_party.pynvml.nvmlDeviceClearAccountingPids", "vllm.third_party.pynvml.nvmlDeviceClearCpuAffinity", "vllm.third_party.pynvml.nvmlDeviceClearEccErrorCounts", "vllm.third_party.pynvml.nvmlDeviceClearFieldValues", "vllm.third_party.pynvml.nvmlDeviceCreateGpuInstance", "vllm.third_party.pynvml.nvmlDeviceCreateGpuInstanceWithPlacement", "vllm.third_party.pynvml.nvmlDeviceCurrentClockFreqs_v1", "vllm.third_party.pynvml.nvmlDeviceDiscoverGpus", "vllm.third_party.pynvml.nvmlDeviceFreezeNvLinkUtilizationCounter", "vllm.third_party.pynvml.nvmlDeviceGetAPIRestriction", "vllm.third_party.pynvml.nvmlDeviceGetAccountingBufferSize", "vllm.third_party.pynvml.nvmlDeviceGetAccountingMode", "vllm.third_party.pynvml.nvmlDeviceGetAccountingPids", "vllm.third_party.pynvml.nvmlDeviceGetAccountingStats", "vllm.third_party.pynvml.nvmlDeviceGetActiveVgpus", "vllm.third_party.pynvml.nvmlDeviceGetAdaptiveClockInfoStatus", "vllm.third_party.pynvml.nvmlDeviceGetApplicationsClock", "vllm.third_party.pynvml.nvmlDeviceGetArchitecture", "vllm.third_party.pynvml.nvmlDeviceGetAttributes", "vllm.third_party.pynvml.nvmlDeviceGetAttributes_v2", "vllm.third_party.pynvml.nvmlDeviceGetAutoBoostedClocksEnabled", "vllm.third_party.pynvml.nvmlDeviceGetBAR1MemoryInfo", "vllm.third_party.pynvml.nvmlDeviceGetBoardId", "vllm.third_party.pynvml.nvmlDeviceGetBoardPartNumber", "vllm.third_party.pynvml.nvmlDeviceGetBrand", "vllm.third_party.pynvml.nvmlDeviceGetBridgeChipInfo", "vllm.third_party.pynvml.nvmlDeviceGetBusType", "vllm.third_party.pynvml.nvmlDeviceGetC2cModeInfoV", "vllm.third_party.pynvml.nvmlDeviceGetC2cModeInfoV1", "vllm.third_party.pynvml.nvmlDeviceGetCapabilities", "vllm.third_party.pynvml.nvmlDeviceGetClkMonStatus", "vllm.third_party.pynvml.nvmlDeviceGetClock", "vllm.third_party.pynvml.nvmlDeviceGetClockInfo", "vllm.third_party.pynvml.nvmlDeviceGetClockOffsets", "vllm.third_party.pynvml.nvmlDeviceGetComputeInstanceId", "vllm.third_party.pynvml.nvmlDeviceGetComputeMode", "vllm.third_party.pynvml.nvmlDeviceGetComputeRunningProcesses", "vllm.third_party.pynvml.nvmlDeviceGetComputeRunningProcesses_v2", "vllm.third_party.pynvml.nvmlDeviceGetComputeRunningProcesses_v3", "vllm.third_party.pynvml.nvmlDeviceGetConfComputeGpuAttestationReport", "vllm.third_party.pynvml.nvmlDeviceGetConfComputeGpuCertificate", "vllm.third_party.pynvml.nvmlDeviceGetConfComputeMemSizeInfo", "vllm.third_party.pynvml.nvmlDeviceGetConfComputeProtectedMemoryUsage", "vllm.third_party.pynvml.nvmlDeviceGetCoolerInfo", "vllm.third_party.pynvml.nvmlDeviceGetCount", "vllm.third_party.pynvml.nvmlDeviceGetCpuAffinity", "vllm.third_party.pynvml.nvmlDeviceGetCpuAffinityWithinScope", "vllm.third_party.pynvml.nvmlDeviceGetCreatableVgpus", "vllm.third_party.pynvml.nvmlDeviceGetCudaComputeCapability", "vllm.third_party.pynvml.nvmlDeviceGetCurrPcieLinkGeneration", "vllm.third_party.pynvml.nvmlDeviceGetCurrPcieLinkWidth", "vllm.third_party.pynvml.nvmlDeviceGetCurrentClockFreqs", "vllm.third_party.pynvml.nvmlDeviceGetCurrentClocksEventReasons", "vllm.third_party.pynvml.nvmlDeviceGetCurrentClocksThrottleReasons", "vllm.third_party.pynvml.nvmlDeviceGetCurrentDramEncryptionMode", "vllm.third_party.pynvml.nvmlDeviceGetCurrentDriverModel", "vllm.third_party.pynvml.nvmlDeviceGetCurrentEccMode", "vllm.third_party.pynvml.nvmlDeviceGetCurrentGpuOperationMode", "vllm.third_party.pynvml.nvmlDeviceGetDecoderUtilization", "vllm.third_party.pynvml.nvmlDeviceGetDefaultApplicationsClock", "vllm.third_party.pynvml.nvmlDeviceGetDefaultEccMode", "vllm.third_party.pynvml.nvmlDeviceGetDetailedEccErrors", "vllm.third_party.pynvml.nvmlDeviceGetDeviceHandleFromMigDeviceHandle", "vllm.third_party.pynvml.nvmlDeviceGetDisplayActive", "vllm.third_party.pynvml.nvmlDeviceGetDisplayMode", "vllm.third_party.pynvml.nvmlDeviceGetDramEncryptionMode", "vllm.third_party.pynvml.nvmlDeviceGetDriverModel", "vllm.third_party.pynvml.nvmlDeviceGetDynamicPstatesInfo", "vllm.third_party.pynvml.nvmlDeviceGetEccMode", "vllm.third_party.pynvml.nvmlDeviceGetEncoderCapacity", "vllm.third_party.pynvml.nvmlDeviceGetEncoderSessions", "vllm.third_party.pynvml.nvmlDeviceGetEncoderStats", "vllm.third_party.pynvml.nvmlDeviceGetEncoderUtilization", "vllm.third_party.pynvml.nvmlDeviceGetEnforcedPowerLimit", "vllm.third_party.pynvml.nvmlDeviceGetFBCSessions", "vllm.third_party.pynvml.nvmlDeviceGetFBCStats", "vllm.third_party.pynvml.nvmlDeviceGetFanControlPolicy_v2", "vllm.third_party.pynvml.nvmlDeviceGetFanSpeed", "vllm.third_party.pynvml.nvmlDeviceGetFanSpeedRPM", "vllm.third_party.pynvml.nvmlDeviceGetFanSpeed_v2", "vllm.third_party.pynvml.nvmlDeviceGetFieldValues", "vllm.third_party.pynvml.nvmlDeviceGetGpcClkMinMaxVfOffset", "vllm.third_party.pynvml.nvmlDeviceGetGpcClkVfOffset", "vllm.third_party.pynvml.nvmlDeviceGetGpuFabricInfo", "vllm.third_party.pynvml.nvmlDeviceGetGpuFabricInfoV", "vllm.third_party.pynvml.nvmlDeviceGetGpuInstanceById", "vllm.third_party.pynvml.nvmlDeviceGetGpuInstanceId", "vllm.third_party.pynvml.nvmlDeviceGetGpuInstancePossiblePlacements", "vllm.third_party.pynvml.nvmlDeviceGetGpuInstanceProfileInfo", "vllm.third_party.pynvml.nvmlDeviceGetGpuInstanceRemainingCapacity", "vllm.third_party.pynvml.nvmlDeviceGetGpuInstances", "vllm.third_party.pynvml.nvmlDeviceGetGpuMaxPcieLinkGeneration", "vllm.third_party.pynvml.nvmlDeviceGetGpuOperationMode", "vllm.third_party.pynvml.nvmlDeviceGetGraphicsRunningProcesses", "vllm.third_party.pynvml.nvmlDeviceGetGraphicsRunningProcesses_v2", "vllm.third_party.pynvml.nvmlDeviceGetGraphicsRunningProcesses_v3", "vllm.third_party.pynvml.nvmlDeviceGetGridLicensableFeatures", "vllm.third_party.pynvml.nvmlDeviceGetGridLicensableFeatures_v4", "vllm.third_party.pynvml.nvmlDeviceGetGspFirmwareMode", "vllm.third_party.pynvml.nvmlDeviceGetGspFirmwareVersion", "vllm.third_party.pynvml.nvmlDeviceGetHandleByIndex", "vllm.third_party.pynvml.nvmlDeviceGetHandleByPciBusId", "vllm.third_party.pynvml.nvmlDeviceGetHandleBySerial", "vllm.third_party.pynvml.nvmlDeviceGetHandleByUUID", "vllm.third_party.pynvml.nvmlDeviceGetHostVgpuMode", "vllm.third_party.pynvml.nvmlDeviceGetIndex", "vllm.third_party.pynvml.nvmlDeviceGetInforomConfigurationChecksum", "vllm.third_party.pynvml.nvmlDeviceGetInforomImageVersion", "vllm.third_party.pynvml.nvmlDeviceGetInforomVersion", "vllm.third_party.pynvml.nvmlDeviceGetIrqNum", "vllm.third_party.pynvml.nvmlDeviceGetJpgUtilization", "vllm.third_party.pynvml.nvmlDeviceGetLastBBXFlushTime", "vllm.third_party.pynvml.nvmlDeviceGetMPSComputeRunningProcesses", "vllm.third_party.pynvml.nvmlDeviceGetMPSComputeRunningProcesses_v2", "vllm.third_party.pynvml.nvmlDeviceGetMPSComputeRunningProcesses_v3", "vllm.third_party.pynvml.nvmlDeviceGetMarginTemperature", "vllm.third_party.pynvml.nvmlDeviceGetMaxClockInfo", "vllm.third_party.pynvml.nvmlDeviceGetMaxCustomerBoostClock", "vllm.third_party.pynvml.nvmlDeviceGetMaxMigDeviceCount", "vllm.third_party.pynvml.nvmlDeviceGetMaxPcieLinkGeneration", "vllm.third_party.pynvml.nvmlDeviceGetMaxPcieLinkWidth", "vllm.third_party.pynvml.nvmlDeviceGetMemClkMinMaxVfOffset", "vllm.third_party.pynvml.nvmlDeviceGetMemClkVfOffset", "vllm.third_party.pynvml.nvmlDeviceGetMemoryAffinity", "vllm.third_party.pynvml.nvmlDeviceGetMemoryBusWidth", "vllm.third_party.pynvml.nvmlDeviceGetMemoryErrorCounter", "vllm.third_party.pynvml.nvmlDeviceGetMemoryInfo", "vllm.third_party.pynvml.nvmlDeviceGetMigDeviceHandleByIndex", "vllm.third_party.pynvml.nvmlDeviceGetMigMode", "vllm.third_party.pynvml.nvmlDeviceGetMinMaxClockOfPState", "vllm.third_party.pynvml.nvmlDeviceGetMinMaxFanSpeed", "vllm.third_party.pynvml.nvmlDeviceGetMinorNumber", "vllm.third_party.pynvml.nvmlDeviceGetModuleId", "vllm.third_party.pynvml.nvmlDeviceGetMultiGpuBoard", "vllm.third_party.pynvml.nvmlDeviceGetName", "vllm.third_party.pynvml.nvmlDeviceGetNumFans", "vllm.third_party.pynvml.nvmlDeviceGetNumGpuCores", "vllm.third_party.pynvml.nvmlDeviceGetNumaNodeId", "vllm.third_party.pynvml.nvmlDeviceGetNvLinkCapability", "vllm.third_party.pynvml.nvmlDeviceGetNvLinkErrorCounter", "vllm.third_party.pynvml.nvmlDeviceGetNvLinkRemoteDeviceType", "vllm.third_party.pynvml.nvmlDeviceGetNvLinkRemotePciInfo", "vllm.third_party.pynvml.nvmlDeviceGetNvLinkState", "vllm.third_party.pynvml.nvmlDeviceGetNvLinkUtilizationControl", "vllm.third_party.pynvml.nvmlDeviceGetNvLinkUtilizationCounter", "vllm.third_party.pynvml.nvmlDeviceGetNvLinkVersion", "vllm.third_party.pynvml.nvmlDeviceGetNvlinkBwMode", "vllm.third_party.pynvml.nvmlDeviceGetNvlinkSupportedBwModes", "vllm.third_party.pynvml.nvmlDeviceGetOfaUtilization", "vllm.third_party.pynvml.nvmlDeviceGetP2PStatus", "vllm.third_party.pynvml.nvmlDeviceGetPciInfo", "vllm.third_party.pynvml.nvmlDeviceGetPciInfoExt", "vllm.third_party.pynvml.nvmlDeviceGetPciInfo_v3", "vllm.third_party.pynvml.nvmlDeviceGetPcieLinkMaxSpeed", "vllm.third_party.pynvml.nvmlDeviceGetPcieReplayCounter", "vllm.third_party.pynvml.nvmlDeviceGetPcieSpeed", "vllm.third_party.pynvml.nvmlDeviceGetPcieThroughput", "vllm.third_party.pynvml.nvmlDeviceGetPendingDramEncryptionMode", "vllm.third_party.pynvml.nvmlDeviceGetPendingDriverModel", "vllm.third_party.pynvml.nvmlDeviceGetPendingEccMode", "vllm.third_party.pynvml.nvmlDeviceGetPendingGpuOperationMode", "vllm.third_party.pynvml.nvmlDeviceGetPerformanceModes", "vllm.third_party.pynvml.nvmlDeviceGetPerformanceState", "vllm.third_party.pynvml.nvmlDeviceGetPersistenceMode", "vllm.third_party.pynvml.nvmlDeviceGetPgpuMetadataString", "vllm.third_party.pynvml.nvmlDeviceGetPlatformInfo", "vllm.third_party.pynvml.nvmlDeviceGetPowerManagementDefaultLimit", "vllm.third_party.pynvml.nvmlDeviceGetPowerManagementLimit", "vllm.third_party.pynvml.nvmlDeviceGetPowerManagementLimitConstraints", "vllm.third_party.pynvml.nvmlDeviceGetPowerManagementMode", "vllm.third_party.pynvml.nvmlDeviceGetPowerSource", "vllm.third_party.pynvml.nvmlDeviceGetPowerState", "vllm.third_party.pynvml.nvmlDeviceGetPowerUsage", "vllm.third_party.pynvml.nvmlDeviceGetProcessUtilization", "vllm.third_party.pynvml.nvmlDeviceGetProcessesUtilizationInfo", "vllm.third_party.pynvml.nvmlDeviceGetRemappedRows", "vllm.third_party.pynvml.nvmlDeviceGetRetiredPages", "vllm.third_party.pynvml.nvmlDeviceGetRetiredPagesPendingStatus", "vllm.third_party.pynvml.nvmlDeviceGetRetiredPages_v2", "vllm.third_party.pynvml.nvmlDeviceGetRowRemapperHistogram", "vllm.third_party.pynvml.nvmlDeviceGetRunningProcessDetailList", "vllm.third_party.pynvml.nvmlDeviceGetSamples", "vllm.third_party.pynvml.nvmlDeviceGetSerial", "vllm.third_party.pynvml.nvmlDeviceGetSramEccErrorStatus", "vllm.third_party.pynvml.nvmlDeviceGetSupportedClocksEventReasons", "vllm.third_party.pynvml.nvmlDeviceGetSupportedClocksThrottleReasons", "vllm.third_party.pynvml.nvmlDeviceGetSupportedEventTypes", "vllm.third_party.pynvml.nvmlDeviceGetSupportedGraphicsClocks", "vllm.third_party.pynvml.nvmlDeviceGetSupportedMemoryClocks", "vllm.third_party.pynvml.nvmlDeviceGetSupportedPerformanceStates", "vllm.third_party.pynvml.nvmlDeviceGetSupportedVgpus", "vllm.third_party.pynvml.nvmlDeviceGetTargetFanSpeed", "vllm.third_party.pynvml.nvmlDeviceGetTemperature", "vllm.third_party.pynvml.nvmlDeviceGetTemperatureThreshold", "vllm.third_party.pynvml.nvmlDeviceGetTemperatureV", "vllm.third_party.pynvml.nvmlDeviceGetTemperatureV1", "vllm.third_party.pynvml.nvmlDeviceGetThermalSettings", "vllm.third_party.pynvml.nvmlDeviceGetTopologyCommonAncestor", "vllm.third_party.pynvml.nvmlDeviceGetTopologyNearestGpus", "vllm.third_party.pynvml.nvmlDeviceGetTotalEccErrors", "vllm.third_party.pynvml.nvmlDeviceGetTotalEnergyConsumption", "vllm.third_party.pynvml.nvmlDeviceGetUUID", "vllm.third_party.pynvml.nvmlDeviceGetUtilizationRates", "vllm.third_party.pynvml.nvmlDeviceGetVbiosVersion", "vllm.third_party.pynvml.nvmlDeviceGetVgpuCapabilities", "vllm.third_party.pynvml.nvmlDeviceGetVgpuHeterogeneousMode", "vllm.third_party.pynvml.nvmlDeviceGetVgpuInstancesUtilizationInfo", "vllm.third_party.pynvml.nvmlDeviceGetVgpuMetadata", "vllm.third_party.pynvml.nvmlDeviceGetVgpuProcessUtilization", "vllm.third_party.pynvml.nvmlDeviceGetVgpuProcessesUtilizationInfo", "vllm.third_party.pynvml.nvmlDeviceGetVgpuSchedulerCapabilities", "vllm.third_party.pynvml.nvmlDeviceGetVgpuSchedulerLog", "vllm.third_party.pynvml.nvmlDeviceGetVgpuSchedulerState", "vllm.third_party.pynvml.nvmlDeviceGetVgpuTypeCreatablePlacements", "vllm.third_party.pynvml.nvmlDeviceGetVgpuTypeSupportedPlacements", "vllm.third_party.pynvml.nvmlDeviceGetVgpuUtilization", "vllm.third_party.pynvml.nvmlDeviceGetViolationStatus", "vllm.third_party.pynvml.nvmlDeviceGetVirtualizationMode", "vllm.third_party.pynvml.nvmlDeviceIsMigDeviceHandle", "vllm.third_party.pynvml.nvmlDeviceModifyDrainState", "vllm.third_party.pynvml.nvmlDeviceOnSameBoard", "vllm.third_party.pynvml.nvmlDevicePerfModes_v1", "vllm.third_party.pynvml.nvmlDevicePowerSmoothingActivatePresetProfile", "vllm.third_party.pynvml.nvmlDevicePowerSmoothingSetState", "vllm.third_party.pynvml.nvmlDevicePowerSmoothingUpdatePresetProfileParam", "vllm.third_party.pynvml.nvmlDeviceQueryDrainState", "vllm.third_party.pynvml.nvmlDeviceRegisterEvents", "vllm.third_party.pynvml.nvmlDeviceRemoveGpu", "vllm.third_party.pynvml.nvmlDeviceResetApplicationsClocks", "vllm.third_party.pynvml.nvmlDeviceResetGpuLockedClocks", "vllm.third_party.pynvml.nvmlDeviceResetMemoryLockedClocks", "vllm.third_party.pynvml.nvmlDeviceResetNvLinkErrorCounters", "vllm.third_party.pynvml.nvmlDeviceResetNvLinkUtilizationCounter", "vllm.third_party.pynvml.nvmlDeviceSetAPIRestriction", "vllm.third_party.pynvml.nvmlDeviceSetAccountingMode", "vllm.third_party.pynvml.nvmlDeviceSetApplicationsClocks", "vllm.third_party.pynvml.nvmlDeviceSetAutoBoostedClocksEnabled", "vllm.third_party.pynvml.nvmlDeviceSetClockOffsets", "vllm.third_party.pynvml.nvmlDeviceSetComputeMode", "vllm.third_party.pynvml.nvmlDeviceSetConfComputeUnprotectedMemSize", "vllm.third_party.pynvml.nvmlDeviceSetCpuAffinity", "vllm.third_party.pynvml.nvmlDeviceSetDefaultAutoBoostedClocksEnabled", "vllm.third_party.pynvml.nvmlDeviceSetDefaultFanSpeed_v2", "vllm.third_party.pynvml.nvmlDeviceSetDramEncryptionMode", "vllm.third_party.pynvml.nvmlDeviceSetDriverModel", "vllm.third_party.pynvml.nvmlDeviceSetEccMode", "vllm.third_party.pynvml.nvmlDeviceSetFanControlPolicy", "vllm.third_party.pynvml.nvmlDeviceSetFanSpeed_v2", "vllm.third_party.pynvml.nvmlDeviceSetGpcClkVfOffset", "vllm.third_party.pynvml.nvmlDeviceSetGpuLockedClocks", "vllm.third_party.pynvml.nvmlDeviceSetGpuOperationMode", "vllm.third_party.pynvml.nvmlDeviceSetMemClkVfOffset", "vllm.third_party.pynvml.nvmlDeviceSetMemoryLockedClocks", "vllm.third_party.pynvml.nvmlDeviceSetMigMode", "vllm.third_party.pynvml.nvmlDeviceSetNvLinkDeviceLowPowerThreshold", "vllm.third_party.pynvml.nvmlDeviceSetNvLinkUtilizationControl", "vllm.third_party.pynvml.nvmlDeviceSetNvlinkBwMode", "vllm.third_party.pynvml.nvmlDeviceSetPersistenceMode", "vllm.third_party.pynvml.nvmlDeviceSetPowerManagementLimit", "vllm.third_party.pynvml.nvmlDeviceSetPowerManagementLimit_v2", "vllm.third_party.pynvml.nvmlDeviceSetTemperatureThreshold", "vllm.third_party.pynvml.nvmlDeviceSetVgpuCapabilities", "vllm.third_party.pynvml.nvmlDeviceSetVgpuHeterogeneousMode", "vllm.third_party.pynvml.nvmlDeviceSetVgpuSchedulerState", "vllm.third_party.pynvml.nvmlDeviceSetVirtualizationMode", "vllm.third_party.pynvml.nvmlDeviceValidateInforom", "vllm.third_party.pynvml.nvmlDeviceWorkloadPowerProfileClearRequestedProfiles", "vllm.third_party.pynvml.nvmlDeviceWorkloadPowerProfileGetCurrentProfiles", "vllm.third_party.pynvml.nvmlDeviceWorkloadPowerProfileGetProfilesInfo", "vllm.third_party.pynvml.nvmlDeviceWorkloadPowerProfileSetRequestedProfiles", "vllm.third_party.pynvml.nvmlDramEncryptionInfo_v1", "vllm.third_party.pynvml.nvmlEccSramErrorStatus_v1", "vllm.third_party.pynvml.nvmlErrorString", "vllm.third_party.pynvml.nvmlEventMigConfigChange", "vllm.third_party.pynvml.nvmlEventSetCreate", "vllm.third_party.pynvml.nvmlEventSetFree", "vllm.third_party.pynvml.nvmlEventSetWait", "vllm.third_party.pynvml.nvmlEventSetWait_v2", "vllm.third_party.pynvml.nvmlEventTypeAll", "vllm.third_party.pynvml.nvmlEventTypeClock", "vllm.third_party.pynvml.nvmlEventTypeDoubleBitEccError", "vllm.third_party.pynvml.nvmlEventTypeDramRetirementEvent", "vllm.third_party.pynvml.nvmlEventTypeDramRetirementFailure", "vllm.third_party.pynvml.nvmlEventTypeFatalPoisonError", "vllm.third_party.pynvml.nvmlEventTypeGpuRecoveryAction", "vllm.third_party.pynvml.nvmlEventTypeGpuUnavailableError", "vllm.third_party.pynvml.nvmlEventTypeNonFatalPoisonError", "vllm.third_party.pynvml.nvmlEventTypeNone", "vllm.third_party.pynvml.nvmlEventTypePState", "vllm.third_party.pynvml.nvmlEventTypePowerSourceChange", "vllm.third_party.pynvml.nvmlEventTypeSingleBitEccError", "vllm.third_party.pynvml.nvmlEventTypeSingleBitEccErrorStorm", "vllm.third_party.pynvml.nvmlEventTypeXidCriticalError", "vllm.third_party.pynvml.nvmlExceptionClass", "vllm.third_party.pynvml.nvmlFanSpeedInfo_v1", "vllm.third_party.pynvml.nvmlFlagDefault", "vllm.third_party.pynvml.nvmlFlagForce", "vllm.third_party.pynvml.nvmlFriendlyObject", "vllm.third_party.pynvml.nvmlFriendlyObjectToStruct", "vllm.third_party.pynvml.nvmlGetExcludedDeviceCount", "vllm.third_party.pynvml.nvmlGetExcludedDeviceInfoByIndex", "vllm.third_party.pynvml.nvmlGetVgpuCompatibility", "vllm.third_party.pynvml.nvmlGetVgpuDriverCapabilities", "vllm.third_party.pynvml.nvmlGetVgpuVersion", "vllm.third_party.pynvml.nvmlGpmMetricsGet", "vllm.third_party.pynvml.nvmlGpmMigSampleGet", "vllm.third_party.pynvml.nvmlGpmQueryDeviceSupport", "vllm.third_party.pynvml.nvmlGpmQueryIfStreamingEnabled", "vllm.third_party.pynvml.nvmlGpmSampleAlloc", "vllm.third_party.pynvml.nvmlGpmSampleFree", "vllm.third_party.pynvml.nvmlGpmSampleGet", "vllm.third_party.pynvml.nvmlGpmSetStreamingEnabled", "vllm.third_party.pynvml.nvmlGpuFabricInfo_v2", "vllm.third_party.pynvml.nvmlGpuInstanceCreateComputeInstance", "vllm.third_party.pynvml.nvmlGpuInstanceCreateComputeInstanceWithPlacement", "vllm.third_party.pynvml.nvmlGpuInstanceDestroy", "vllm.third_party.pynvml.nvmlGpuInstanceGetComputeInstanceById", "vllm.third_party.pynvml.nvmlGpuInstanceGetComputeInstancePossiblePlacements", "vllm.third_party.pynvml.nvmlGpuInstanceGetComputeInstanceProfileInfo", "vllm.third_party.pynvml.nvmlGpuInstanceGetComputeInstanceRemainingCapacity", "vllm.third_party.pynvml.nvmlGpuInstanceGetComputeInstances", "vllm.third_party.pynvml.nvmlGpuInstanceGetInfo", "vllm.third_party.pynvml.nvmlGpuInstanceProfileInfo_v2", "vllm.third_party.pynvml.nvmlInit", "vllm.third_party.pynvml.nvmlInitWithFlags", "vllm.third_party.pynvml.nvmlLib", "vllm.third_party.pynvml.nvmlMarginTemperature_v1", "vllm.third_party.pynvml.nvmlMemory_v2", "vllm.third_party.pynvml.nvmlNvLinkUtilizationControl_t", "vllm.third_party.pynvml.nvmlNvlinkGetBwMode_v1", "vllm.third_party.pynvml.nvmlNvlinkSetBwMode_v1", "vllm.third_party.pynvml.nvmlNvlinkSupportedBwModes_v1", "vllm.third_party.pynvml.nvmlPciInfoExt_v1", "vllm.third_party.pynvml.nvmlPciInfoExt_v1_t", "vllm.third_party.pynvml.nvmlPciInfo_t", "vllm.third_party.pynvml.nvmlPciInfo_v2_t", "vllm.third_party.pynvml.nvmlPlatformInfo_v1", "vllm.third_party.pynvml.nvmlPowerSmoothingProfile_v1", "vllm.third_party.pynvml.nvmlPowerSmoothingState_v1", "vllm.third_party.pynvml.nvmlPowerValue_v2", "vllm.third_party.pynvml.nvmlProcessDetailList_v1", "vllm.third_party.pynvml.nvmlSetVgpuVersion", "vllm.third_party.pynvml.nvmlShutdown", "vllm.third_party.pynvml.nvmlStructToFriendlyObject", "vllm.third_party.pynvml.nvmlSystemConfComputeSettings_v1", "vllm.third_party.pynvml.nvmlSystemGetConfComputeCapabilities", "vllm.third_party.pynvml.nvmlSystemGetConfComputeGpusReadyState", "vllm.third_party.pynvml.nvmlSystemGetConfComputeKeyRotationThresholdInfo", "vllm.third_party.pynvml.nvmlSystemGetConfComputeSettings", "vllm.third_party.pynvml.nvmlSystemGetConfComputeState", "vllm.third_party.pynvml.nvmlSystemGetCudaDriverVersion", "vllm.third_party.pynvml.nvmlSystemGetCudaDriverVersion_v2", "vllm.third_party.pynvml.nvmlSystemGetDriverBranch", "vllm.third_party.pynvml.nvmlSystemGetDriverVersion", "vllm.third_party.pynvml.nvmlSystemGetHicVersion", "vllm.third_party.pynvml.nvmlSystemGetNVMLVersion", "vllm.third_party.pynvml.nvmlSystemGetNvlinkBwMode", "vllm.third_party.pynvml.nvmlSystemGetProcessName", "vllm.third_party.pynvml.nvmlSystemGetTopologyGpuSet", "vllm.third_party.pynvml.nvmlSystemSetConfComputeGpusReadyState", "vllm.third_party.pynvml.nvmlSystemSetConfComputeKeyRotationThresholdInfo", "vllm.third_party.pynvml.nvmlSystemSetNvlinkBwMode", "vllm.third_party.pynvml.nvmlTemperature_v1", "vllm.third_party.pynvml.nvmlUnitGetCount", "vllm.third_party.pynvml.nvmlUnitGetDeviceCount", "vllm.third_party.pynvml.nvmlUnitGetDevices", "vllm.third_party.pynvml.nvmlUnitGetFanSpeedInfo", "vllm.third_party.pynvml.nvmlUnitGetHandleByIndex", "vllm.third_party.pynvml.nvmlUnitGetLedState", "vllm.third_party.pynvml.nvmlUnitGetPsuInfo", "vllm.third_party.pynvml.nvmlUnitGetTemperature", "vllm.third_party.pynvml.nvmlUnitGetUnitInfo", "vllm.third_party.pynvml.nvmlUnitSetLedState", "vllm.third_party.pynvml.nvmlVgpuInstanceClearAccountingPids", "vllm.third_party.pynvml.nvmlVgpuInstanceGetAccountingMode", "vllm.third_party.pynvml.nvmlVgpuInstanceGetAccountingPids", "vllm.third_party.pynvml.nvmlVgpuInstanceGetAccountingStats", "vllm.third_party.pynvml.nvmlVgpuInstanceGetEccMode", "vllm.third_party.pynvml.nvmlVgpuInstanceGetEncoderCapacity", "vllm.third_party.pynvml.nvmlVgpuInstanceGetEncoderSessions", "vllm.third_party.pynvml.nvmlVgpuInstanceGetEncoderStats", "vllm.third_party.pynvml.nvmlVgpuInstanceGetFBCSessions", "vllm.third_party.pynvml.nvmlVgpuInstanceGetFBCStats", "vllm.third_party.pynvml.nvmlVgpuInstanceGetFbUsage", "vllm.third_party.pynvml.nvmlVgpuInstanceGetFrameRateLimit", "vllm.third_party.pynvml.nvmlVgpuInstanceGetGpuInstanceId", "vllm.third_party.pynvml.nvmlVgpuInstanceGetGpuPciId", "vllm.third_party.pynvml.nvmlVgpuInstanceGetLicenseInfo", "vllm.third_party.pynvml.nvmlVgpuInstanceGetLicenseInfo_v2", "vllm.third_party.pynvml.nvmlVgpuInstanceGetLicenseStatus", "vllm.third_party.pynvml.nvmlVgpuInstanceGetMdevUUID", "vllm.third_party.pynvml.nvmlVgpuInstanceGetMetadata", "vllm.third_party.pynvml.nvmlVgpuInstanceGetPlacementId", "vllm.third_party.pynvml.nvmlVgpuInstanceGetRuntimeStateSize", "vllm.third_party.pynvml.nvmlVgpuInstanceGetType", "vllm.third_party.pynvml.nvmlVgpuInstanceGetUUID", "vllm.third_party.pynvml.nvmlVgpuInstanceGetVmDriverVersion", "vllm.third_party.pynvml.nvmlVgpuInstanceGetVmID", "vllm.third_party.pynvml.nvmlVgpuInstanceSetEncoderCapacity", "vllm.third_party.pynvml.nvmlVgpuRuntimeState_v1_t", "vllm.third_party.pynvml.nvmlVgpuTypeGetBAR1Info", "vllm.third_party.pynvml.nvmlVgpuTypeGetCapabilities", "vllm.third_party.pynvml.nvmlVgpuTypeGetClass", "vllm.third_party.pynvml.nvmlVgpuTypeGetDeviceID", "vllm.third_party.pynvml.nvmlVgpuTypeGetFbReservation", "vllm.third_party.pynvml.nvmlVgpuTypeGetFrameRateLimit", "vllm.third_party.pynvml.nvmlVgpuTypeGetFramebufferSize", "vllm.third_party.pynvml.nvmlVgpuTypeGetGpuInstanceProfileId", "vllm.third_party.pynvml.nvmlVgpuTypeGetGspHeapSize", "vllm.third_party.pynvml.nvmlVgpuTypeGetLicense", "vllm.third_party.pynvml.nvmlVgpuTypeGetMaxInstances", "vllm.third_party.pynvml.nvmlVgpuTypeGetMaxInstancesPerVm", "vllm.third_party.pynvml.nvmlVgpuTypeGetName", "vllm.third_party.pynvml.nvmlVgpuTypeGetNumDisplayHeads", "vllm.third_party.pynvml.nvmlVgpuTypeGetResolution", "vllm.third_party.pynvml.nvmlWorkloadPowerProfileCurrentProfiles_v1", "vllm.third_party.pynvml.nvmlWorkloadPowerProfileInfo_v1", "vllm.third_party.pynvml.nvmlWorkloadPowerProfileProfilesInfo_v1", "vllm.third_party.pynvml.nvmlWorkloadPowerProfileRequestedProfiles_v1", "vllm.third_party.pynvml.struct_c_nvmlComputeInstance_t", "vllm.third_party.pynvml.struct_c_nvmlDevice_t", "vllm.third_party.pynvml.struct_c_nvmlEventSet_t", "vllm.third_party.pynvml.struct_c_nvmlGpmSample_t", "vllm.third_party.pynvml.struct_c_nvmlGpuInstance_t", "vllm.third_party.pynvml.struct_c_nvmlUnit_t", "vllm.third_party.pynvml.throwOnVersionMismatch" ], "n_typable": 980, "n_typed": 0, "n_any": 0, "n_untyped": 980, "n_functions": 375, "n_function_overloads": 375, "n_function_params": 563, "n_methods": 22, "n_method_overloads": 22, "n_method_params": 3, "n_classes": 135, "n_attrs": 1129, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/third_party/triton_kernels/compaction.py", "symbol_reports": [ { "kind": "function", "name": "vllm.third_party.triton_kernels.compaction.compaction", "n_typed": 0, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.compaction.compaction_torch", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "type_ignores": [], "name": "vllm.third_party.triton_kernels.compaction", "names": [ "vllm.third_party.triton_kernels.compaction.compaction", "vllm.third_party.triton_kernels.compaction.compaction_torch" ], "n_typable": 10, "n_typed": 3, "n_any": 0, "n_untyped": 7, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 8, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/third_party/triton_kernels/distributed.py", "symbol_reports": [ { "kind": "function", "name": "vllm.third_party.triton_kernels.distributed.make_expt_assignment", "n_typed": 2, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.distributed.make_expt_dict_random", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.triton_kernels.distributed.symm_mem_pool", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.distributed.make_expt_dict_uniform", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.third_party.triton_kernels.distributed.SymmetricMemoryPool", "methods": [ { "kind": "function", "name": "SymmetricMemoryPool.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SymmetricMemoryPool.align_up", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SymmetricMemoryPool._reserve_region", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "SymmetricMemoryPool.make_empty", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "SymmetricMemoryPool._initialize", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SymmetricMemoryPool.initialize_matmul_ogs", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SymmetricMemoryPool.size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SymmetricMemoryPool.buf", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SymmetricMemoryPool.bufs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SymmetricMemoryPool.hdl", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SymmetricMemoryPool.regions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 34, "n_typed": 28, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 23, "n_attrs": 5, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.distributed.convert_dp_to_ep", "n_typed": 0, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.distributed.convert_ep_to_dp", "n_typed": 0, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.third_party.triton_kernels.distributed.ExptAssignment", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ExptAssignment.expt_bitmask", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ExptAssignment.expt_boolmask", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ExptAssignment.expt_map", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ExptAssignment.n_expts_per_shard", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.third_party.triton_kernels.distributed", "names": [ "vllm.third_party.triton_kernels.distributed.ExptAssignment", "vllm.third_party.triton_kernels.distributed.SymmetricMemoryPool", "vllm.third_party.triton_kernels.distributed.convert_dp_to_ep", "vllm.third_party.triton_kernels.distributed.convert_ep_to_dp", "vllm.third_party.triton_kernels.distributed.make_expt_assignment", "vllm.third_party.triton_kernels.distributed.make_expt_dict_random", "vllm.third_party.triton_kernels.distributed.make_expt_dict_uniform", "vllm.third_party.triton_kernels.distributed.symm_mem_pool" ], "n_typable": 56, "n_typed": 30, "n_any": 0, "n_untyped": 26, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 16, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 23, "n_classes": 2, "n_attrs": 10, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/third_party/triton_kernels/matmul_ogs.py", "symbol_reports": [ { "kind": "class", "name": "vllm.third_party.triton_kernels.matmul_ogs.FnName", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "FnName.QUANTIZE_MXFP8", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.third_party.triton_kernels.matmul_ogs.Epilogue", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Epilogue.specs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Epilogue.fn_arg_values_matmul", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Epilogue.fn_arg_values_finalize", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Epilogue.effective_itemsize", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.matmul_ogs.matmul_ogs_set_idle_sms", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.third_party.triton_kernels.matmul_ogs.FusedComm", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "FusedComm.out_handles", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedComm.scatter_shard_indx", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedComm.reduce_rank", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedComm.n_reduce_shards", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.third_party.triton_kernels.matmul_ogs.PrecisionConfig", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "PrecisionConfig.max_num_imprecise_acc", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PrecisionConfig.allow_tf32", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PrecisionConfig.flex_ctx", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PrecisionConfig.acc_scale", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PrecisionConfig.flexpoint_saturate_inf", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PrecisionConfig.report_quantization_err_fn", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PrecisionConfig.act_scale", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PrecisionConfig.weight_scale", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PrecisionConfig.out_scale", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PrecisionConfig.out_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PrecisionConfig.enforce_bitwise_invariance", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 11, "n_properties": 0 }, { "kind": "class", "name": "vllm.third_party.triton_kernels.matmul_ogs.FusedActivation", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "FusedActivation.specs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FusedActivation.fn_args", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.matmul_ogs.get_swap_xw", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.matmul_ogs.post_matmul_comm_torch", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.matmul_ogs.init_allocation", "n_typed": 0, "n_any": 0, "n_untyped": 11, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.matmul_ogs.apply_allocation", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.matmul_ogs.matmul_ogs", "n_typed": 13, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 17, "n_params": 16, "n_function_overloads": 1, "n_function_params": 16 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.matmul_ogs.can_overflow_int32", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.third_party.triton_kernels.matmul_ogs.RoutingData", "methods": [ { "kind": "function", "name": "RoutingData.n_blocks", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RoutingData.gate_scal", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RoutingData.expt_hist", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RoutingData.n_expts_tot", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RoutingData.n_expts_act", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RoutingData.expt_data", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RoutingData.expected_tokens_per_expt", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 3, "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 6, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.matmul_ogs.should_upcast_indices", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.third_party.triton_kernels.matmul_ogs.GatherIndx", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "GatherIndx.src_indx", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GatherIndx.dst_indx", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.third_party.triton_kernels.matmul_ogs.MatmulAllocation", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "MatmulAllocation.device", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MatmulAllocation.output", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MatmulAllocation.scratchpads", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.matmul_ogs.matmul_ogs_torch", "n_typed": 5, "n_any": 0, "n_untyped": 8, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 }, { "kind": "class", "name": "vllm.third_party.triton_kernels.matmul_ogs.ScatterIndx", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ScatterIndx.src_indx", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ScatterIndx.dst_indx", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.third_party.triton_kernels.matmul_ogs.FlexCtx", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "FlexCtx.lhs_data", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlexCtx.rhs_data", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlexCtx.out_data", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlexCtx.acc_data", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.third_party.triton_kernels.matmul_ogs.InnerRoutingData", "methods": [ { "kind": "function", "name": "InnerRoutingData.make_kernel_args", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "InnerRoutingData.base", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "InnerRoutingData.block_k", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "InnerRoutingData.x_is_padded", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "InnerRoutingData.w_is_padded", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 3, "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 4, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.triton_kernels.matmul_ogs.specializations", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.third_party.triton_kernels.matmul_ogs", "names": [ "vllm.third_party.triton_kernels.matmul_ogs.Epilogue", "vllm.third_party.triton_kernels.matmul_ogs.FlexCtx", "vllm.third_party.triton_kernels.matmul_ogs.FnName", "vllm.third_party.triton_kernels.matmul_ogs.FusedActivation", "vllm.third_party.triton_kernels.matmul_ogs.FusedComm", "vllm.third_party.triton_kernels.matmul_ogs.GatherIndx", "vllm.third_party.triton_kernels.matmul_ogs.InnerRoutingData", "vllm.third_party.triton_kernels.matmul_ogs.MatmulAllocation", "vllm.third_party.triton_kernels.matmul_ogs.PrecisionConfig", "vllm.third_party.triton_kernels.matmul_ogs.RoutingData", "vllm.third_party.triton_kernels.matmul_ogs.ScatterIndx", "vllm.third_party.triton_kernels.matmul_ogs.apply_allocation", "vllm.third_party.triton_kernels.matmul_ogs.can_overflow_int32", "vllm.third_party.triton_kernels.matmul_ogs.get_swap_xw", "vllm.third_party.triton_kernels.matmul_ogs.init_allocation", "vllm.third_party.triton_kernels.matmul_ogs.matmul_ogs", "vllm.third_party.triton_kernels.matmul_ogs.matmul_ogs_set_idle_sms", "vllm.third_party.triton_kernels.matmul_ogs.matmul_ogs_torch", "vllm.third_party.triton_kernels.matmul_ogs.post_matmul_comm_torch", "vllm.third_party.triton_kernels.matmul_ogs.should_upcast_indices", "vllm.third_party.triton_kernels.matmul_ogs.specializations" ], "n_typable": 66, "n_typed": 25, "n_any": 0, "n_untyped": 41, "n_functions": 9, "n_function_overloads": 9, "n_function_params": 50, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_classes": 11, "n_attrs": 44, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/third_party/triton_kernels/numerics.py", "symbol_reports": [ { "kind": "class", "name": "vllm.third_party.triton_kernels.numerics.BaseFlexData", "methods": [ { "kind": "function", "name": "BaseFlexData.view", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseFlexData.reinterpret", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BaseFlexData.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 4, "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.triton_kernels.numerics.MAX_FINITE_FLOAT8E5", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.triton_kernels.numerics.MAX_FINITE_FLOAT8E4NV", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.triton_kernels.numerics.MAX_FINITE_FLOAT8E4B8", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.third_party.triton_kernels.numerics.InFlexData", "methods": [], "properties": [ { "kind": "property", "name": "InFlexData.is_per_batch", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "InFlexData.scale", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 1 }, { "kind": "class", "name": "vllm.third_party.triton_kernels.numerics.OutFlexData", "methods": [ { "kind": "function", "name": "OutFlexData.__iter__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "OutFlexData.is_per_batch", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "OutFlexData.expected_scale", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "OutFlexData.actual_scale", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "OutFlexData.checksum_scale", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 2, "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 3, "n_properties": 1 } ], "type_ignores": [], "name": "vllm.third_party.triton_kernels.numerics", "names": [ "vllm.third_party.triton_kernels.numerics.BaseFlexData", "vllm.third_party.triton_kernels.numerics.InFlexData", "vllm.third_party.triton_kernels.numerics.MAX_FINITE_FLOAT8E4B8", "vllm.third_party.triton_kernels.numerics.MAX_FINITE_FLOAT8E4NV", "vllm.third_party.triton_kernels.numerics.MAX_FINITE_FLOAT8E5", "vllm.third_party.triton_kernels.numerics.OutFlexData" ], "n_typable": 7, "n_typed": 1, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 2, "n_classes": 3, "n_attrs": 8, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/third_party/triton_kernels/numerics_details/flexpoint.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.third_party.triton_kernels.numerics_details.flexpoint.TL_MAX_FINITE_FLOAT8E4NV", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.numerics_details.flexpoint.flex_to_float", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.triton_kernels.numerics_details.flexpoint.TL_RCP_MAX_FINITE_FLOAT16", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.numerics_details.flexpoint.load_scale", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.numerics_details.flexpoint.sm86_min_nan_xorsign_abs_f32", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.numerics_details.flexpoint.update_scale", "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.third_party.triton_kernels.numerics_details.flexpoint.TL_MAX_FINITE_FLOAT8E5", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.third_party.triton_kernels.numerics_details.flexpoint.TL_RCP_MAX_FINITE_FLOAT8E4B15", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.third_party.triton_kernels.numerics_details.flexpoint.TL_RCP_MAX_FINITE_FLOAT8E5", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.third_party.triton_kernels.numerics_details.flexpoint.TL_RCP_MAX_FINITE_FLOAT8E4NV", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.numerics_details.flexpoint.sm86_max_nan_xorsign_abs_f32", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.triton_kernels.numerics_details.flexpoint.TL_RCP_MAX_FINITE_FLOAT8E4B8", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.numerics_details.flexpoint.float_to_flex", "n_typed": 1, "n_any": 0, "n_untyped": 7, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.numerics_details.flexpoint.max_finite", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.numerics_details.flexpoint.compute_scale", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.numerics_details.flexpoint.nan_propagating_absmax_reduce", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.third_party.triton_kernels.numerics_details.flexpoint.TL_MAX_FINITE_FLOAT16", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.third_party.triton_kernels.numerics_details.flexpoint.TL_MAX_FINITE_FLOAT8E4B8", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.numerics_details.flexpoint.clip", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.numerics_details.flexpoint.rcp_max_finite", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.third_party.triton_kernels.numerics_details.flexpoint.TL_MAX_FINITE_FLOAT8E4B15", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.third_party.triton_kernels.numerics_details.flexpoint", "names": [ "vllm.third_party.triton_kernels.numerics_details.flexpoint.TL_MAX_FINITE_FLOAT16", "vllm.third_party.triton_kernels.numerics_details.flexpoint.TL_MAX_FINITE_FLOAT8E4B15", "vllm.third_party.triton_kernels.numerics_details.flexpoint.TL_MAX_FINITE_FLOAT8E4B8", "vllm.third_party.triton_kernels.numerics_details.flexpoint.TL_MAX_FINITE_FLOAT8E4NV", "vllm.third_party.triton_kernels.numerics_details.flexpoint.TL_MAX_FINITE_FLOAT8E5", "vllm.third_party.triton_kernels.numerics_details.flexpoint.TL_RCP_MAX_FINITE_FLOAT16", "vllm.third_party.triton_kernels.numerics_details.flexpoint.TL_RCP_MAX_FINITE_FLOAT8E4B15", "vllm.third_party.triton_kernels.numerics_details.flexpoint.TL_RCP_MAX_FINITE_FLOAT8E4B8", "vllm.third_party.triton_kernels.numerics_details.flexpoint.TL_RCP_MAX_FINITE_FLOAT8E4NV", "vllm.third_party.triton_kernels.numerics_details.flexpoint.TL_RCP_MAX_FINITE_FLOAT8E5", "vllm.third_party.triton_kernels.numerics_details.flexpoint.clip", "vllm.third_party.triton_kernels.numerics_details.flexpoint.compute_scale", "vllm.third_party.triton_kernels.numerics_details.flexpoint.flex_to_float", "vllm.third_party.triton_kernels.numerics_details.flexpoint.float_to_flex", "vllm.third_party.triton_kernels.numerics_details.flexpoint.load_scale", "vllm.third_party.triton_kernels.numerics_details.flexpoint.max_finite", "vllm.third_party.triton_kernels.numerics_details.flexpoint.nan_propagating_absmax_reduce", "vllm.third_party.triton_kernels.numerics_details.flexpoint.rcp_max_finite", "vllm.third_party.triton_kernels.numerics_details.flexpoint.sm86_max_nan_xorsign_abs_f32", "vllm.third_party.triton_kernels.numerics_details.flexpoint.sm86_min_nan_xorsign_abs_f32", "vllm.third_party.triton_kernels.numerics_details.flexpoint.update_scale" ], "n_typable": 46, "n_typed": 2, "n_any": 0, "n_untyped": 44, "n_functions": 11, "n_function_overloads": 11, "n_function_params": 25, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 10, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/third_party/triton_kernels/numerics_details/mxfp.py", "symbol_reports": [ { "kind": "function", "name": "vllm.third_party.triton_kernels.numerics_details.mxfp.downcast_to_mxfp_torch", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.numerics_details.mxfp.upcast_from_mxfp_torch", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.numerics_details.mxfp.upcast_from_mxfp", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.third_party.triton_kernels.numerics_details.mxfp.DequantScaleRoundingMode", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "DequantScaleRoundingMode.ROUND_UP", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DequantScaleRoundingMode.ROUND_DOWN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.numerics_details.mxfp.right_shift_unsigned", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.numerics_details.mxfp.downcast_to_mxfp", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.numerics_details.mxfp.get_max_quant_val", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.numerics_details.mxfp.cvt_e2m1_to_fp32", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.third_party.triton_kernels.numerics_details.mxfp", "names": [ "vllm.third_party.triton_kernels.numerics_details.mxfp.DequantScaleRoundingMode", "vllm.third_party.triton_kernels.numerics_details.mxfp.cvt_e2m1_to_fp32", "vllm.third_party.triton_kernels.numerics_details.mxfp.downcast_to_mxfp", "vllm.third_party.triton_kernels.numerics_details.mxfp.downcast_to_mxfp_torch", "vllm.third_party.triton_kernels.numerics_details.mxfp.get_max_quant_val", "vllm.third_party.triton_kernels.numerics_details.mxfp.right_shift_unsigned", "vllm.third_party.triton_kernels.numerics_details.mxfp.upcast_from_mxfp", "vllm.third_party.triton_kernels.numerics_details.mxfp.upcast_from_mxfp_torch" ], "n_typable": 27, "n_typed": 17, "n_any": 0, "n_untyped": 10, "n_functions": 7, "n_function_overloads": 7, "n_function_params": 20, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 1, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/third_party/triton_kernels/proton_opts.py", "symbol_reports": [ { "kind": "function", "name": "vllm.third_party.triton_kernels.proton_opts.set_launch_metadata_allow_sync", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.proton_opts.launch_metadata_allow_sync", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "type_ignores": [], "name": "vllm.third_party.triton_kernels.proton_opts", "names": [ "vllm.third_party.triton_kernels.proton_opts.launch_metadata_allow_sync", "vllm.third_party.triton_kernels.proton_opts.set_launch_metadata_allow_sync" ], "n_typable": 3, "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 1, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/third_party/triton_kernels/reduce.py", "symbol_reports": [ { "kind": "function", "name": "vllm.third_party.triton_kernels.reduce.reduce", "n_typed": 14, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 }, { "kind": "class", "name": "vllm.third_party.triton_kernels.reduce.PostprocessFn", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "PostprocessFn.specs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PostprocessFn.fn_args", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.reduce.reduce_torch", "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.reduce.compute_actual_scale", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.third_party.triton_kernels.reduce.specializations", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.third_party.triton_kernels.reduce", "names": [ "vllm.third_party.triton_kernels.reduce.PostprocessFn", "vllm.third_party.triton_kernels.reduce.compute_actual_scale", "vllm.third_party.triton_kernels.reduce.reduce", "vllm.third_party.triton_kernels.reduce.reduce_torch", "vllm.third_party.triton_kernels.reduce.specializations" ], "n_typable": 29, "n_typed": 23, "n_any": 0, "n_untyped": 6, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 25, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 1, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/third_party/triton_kernels/roofline.py", "symbol_reports": [ { "kind": "class", "name": "vllm.third_party.triton_kernels.roofline.PerfRecord", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "PerfRecord.time_ns", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PerfRecord.flops", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PerfRecord.bytes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.roofline.write_csv", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.roofline.parse_profile", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.roofline.load_perf_csv", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.roofline.compute_roofline", "n_typed": 0, "n_any": 0, "n_untyped": 8, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.roofline.get_cublas_tflops", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.roofline.plot_roofline", "n_typed": 0, "n_any": 0, "n_untyped": 10, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "attr", "name": "vllm.third_party.triton_kernels.roofline.parser", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.third_party.triton_kernels.roofline.args", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.roofline.validate_perfs", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.roofline.get_memset_tbps", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "type_ignores": [], "name": "vllm.third_party.triton_kernels.roofline", "names": [ "vllm.third_party.triton_kernels.roofline.PerfRecord", "vllm.third_party.triton_kernels.roofline.args", "vllm.third_party.triton_kernels.roofline.compute_roofline", "vllm.third_party.triton_kernels.roofline.get_cublas_tflops", "vllm.third_party.triton_kernels.roofline.get_memset_tbps", "vllm.third_party.triton_kernels.roofline.load_perf_csv", "vllm.third_party.triton_kernels.roofline.parse_profile", "vllm.third_party.triton_kernels.roofline.parser", "vllm.third_party.triton_kernels.roofline.plot_roofline", "vllm.third_party.triton_kernels.roofline.validate_perfs", "vllm.third_party.triton_kernels.roofline.write_csv" ], "n_typable": 34, "n_typed": 0, "n_any": 0, "n_untyped": 34, "n_functions": 8, "n_function_overloads": 8, "n_function_params": 24, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 1, "n_attrs": 5, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/third_party/triton_kernels/specialize.py", "symbol_reports": [ { "kind": "class", "name": "vllm.third_party.triton_kernels.specialize.ClosureArg", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ClosureArg.fn_name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ClosureArg.fn_params_name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.specialize.specialize", "n_typed": 0, "n_any": 0, "n_untyped": 7, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "class", "name": "vllm.third_party.triton_kernels.specialize.SpecializationModule", "methods": [ { "kind": "function", "name": "SpecializationModule.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SpecializationModule.get", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SpecializationModule.module_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecializationModule.kernels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecializationModule.closure_args", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 3, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 3, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.specialize.cacheable", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.specialize.define_kernel", "n_typed": 0, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.third_party.triton_kernels.specialize.FnSpecs", "methods": [ { "kind": "function", "name": "FnSpecs.default", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FnSpecs.name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FnSpecs.fn", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FnSpecs.fn_arg_names", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FnSpecs.fn_arg_do_not_specialize", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FnSpecs.reduction_n", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 5, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.third_party.triton_kernels.specialize", "names": [ "vllm.third_party.triton_kernels.specialize.ClosureArg", "vllm.third_party.triton_kernels.specialize.FnSpecs", "vllm.third_party.triton_kernels.specialize.SpecializationModule", "vllm.third_party.triton_kernels.specialize.cacheable", "vllm.third_party.triton_kernels.specialize.define_kernel", "vllm.third_party.triton_kernels.specialize.specialize" ], "n_typable": 24, "n_typed": 3, "n_any": 0, "n_untyped": 21, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 11, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_classes": 3, "n_attrs": 10, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/third_party/triton_kernels/swiglu.py", "symbol_reports": [ { "kind": "function", "name": "vllm.third_party.triton_kernels.swiglu.swiglu_torch", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.third_party.triton_kernels.swiglu.PrecisionConfig", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "PrecisionConfig.limit", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PrecisionConfig.flex_ctx", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.swiglu.swiglu", "n_typed": 0, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.third_party.triton_kernels.swiglu.SwiGLU", "methods": [ { "kind": "function", "name": "SwiGLU.forward", "n_typed": 0, "n_any": 0, "n_untyped": 6, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 0, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.third_party.triton_kernels.swiglu.FlexCtx", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "FlexCtx.out_data", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlexCtx.inp_data", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlexCtx.saturate_inf", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.third_party.triton_kernels.swiglu", "names": [ "vllm.third_party.triton_kernels.swiglu.FlexCtx", "vllm.third_party.triton_kernels.swiglu.PrecisionConfig", "vllm.third_party.triton_kernels.swiglu.SwiGLU", "vllm.third_party.triton_kernels.swiglu.swiglu", "vllm.third_party.triton_kernels.swiglu.swiglu_torch" ], "n_typable": 15, "n_typed": 0, "n_any": 0, "n_untyped": 15, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 7, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 5, "n_classes": 3, "n_attrs": 5, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/third_party/triton_kernels/target_info.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.third_party.triton_kernels.target_info.is_hip_cdna3", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.third_party.triton_kernels.target_info.is_cuda", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.target_info.num_sms", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.third_party.triton_kernels.target_info.is_hip", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.target_info.has_native_mxfp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.third_party.triton_kernels.target_info.is_hip_cdna4", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.target_info.get_cdna_version", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.third_party.triton_kernels.target_info.cuda_capability_geq", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.target_info.has_tma_gather", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "type_ignores": [], "name": "vllm.third_party.triton_kernels.target_info", "names": [ "vllm.third_party.triton_kernels.target_info.cuda_capability_geq", "vllm.third_party.triton_kernels.target_info.get_cdna_version", "vllm.third_party.triton_kernels.target_info.has_native_mxfp", "vllm.third_party.triton_kernels.target_info.has_tma_gather", "vllm.third_party.triton_kernels.target_info.is_cuda", "vllm.third_party.triton_kernels.target_info.is_hip", "vllm.third_party.triton_kernels.target_info.is_hip_cdna3", "vllm.third_party.triton_kernels.target_info.is_hip_cdna4", "vllm.third_party.triton_kernels.target_info.num_sms" ], "n_typable": 4, "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 5, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/third_party/triton_kernels/tensor.py", "symbol_reports": [ { "kind": "class", "name": "vllm.third_party.triton_kernels.tensor.FloatType", "methods": [ { "kind": "function", "name": "FloatType.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FloatType.bitwidth_exponent", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FloatType.bitwidth_mantissa", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FloatType.is_signed", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.third_party.triton_kernels.tensor.SparseMatrix", "methods": [ { "kind": "function", "name": "SparseMatrix.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SparseMatrix.indx", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SparseMatrix.vals", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SparseMatrix.mask", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.tensor.bitwidth", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.third_party.triton_kernels.tensor.Tensor", "methods": [ { "kind": "function", "name": "Tensor.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Tensor.stride", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Tensor.data_ptr", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Tensor.numel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Tensor.element_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Tensor.dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Tensor.size", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "Tensor.ndim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "Tensor.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "Tensor.data", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "Tensor.storage", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Tensor.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Tensor.shape", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Tensor.shape_max", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 12, "n_typed": 0, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 2, "n_attrs": 4, "n_properties": 3 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.tensor.convert_layout", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.third_party.triton_kernels.tensor.Bitmatrix", "methods": [ { "kind": "function", "name": "Bitmatrix.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.tensor.wrap_torch_tensor", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.third_party.triton_kernels.tensor.Storage", "methods": [ { "kind": "function", "name": "Storage.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Storage.is_tma_compliant", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Storage.make_dense_tma", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Storage.make_tma", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [ { "kind": "property", "name": "Storage.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "Storage.data", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Storage.layout", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 10, "n_typed": 0, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 5, "n_attrs": 2, "n_properties": 1 }, { "kind": "class", "name": "vllm.third_party.triton_kernels.tensor.RaggedTensor", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "RaggedTensor.slice_sizes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RaggedTensor.data", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RaggedTensor.metadata", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.third_party.triton_kernels.tensor.IntegerType", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "IntegerType.bitwidth", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.third_party.triton_kernels.tensor.BIT", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.third_party.triton_kernels.tensor.FP4", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.tensor.get_layout", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.third_party.triton_kernels.tensor", "names": [ "vllm.third_party.triton_kernels.tensor.BIT", "vllm.third_party.triton_kernels.tensor.Bitmatrix", "vllm.third_party.triton_kernels.tensor.FP4", "vllm.third_party.triton_kernels.tensor.FloatType", "vllm.third_party.triton_kernels.tensor.IntegerType", "vllm.third_party.triton_kernels.tensor.RaggedTensor", "vllm.third_party.triton_kernels.tensor.SparseMatrix", "vllm.third_party.triton_kernels.tensor.Storage", "vllm.third_party.triton_kernels.tensor.Tensor", "vllm.third_party.triton_kernels.tensor.bitwidth", "vllm.third_party.triton_kernels.tensor.convert_layout", "vllm.third_party.triton_kernels.tensor.get_layout", "vllm.third_party.triton_kernels.tensor.wrap_torch_tensor" ], "n_typable": 38, "n_typed": 4, "n_any": 0, "n_untyped": 34, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 7, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 7, "n_classes": 7, "n_attrs": 18, "n_properties": 4, "n_type_ignores": 0 }, { "path": "vllm/third_party/triton_kernels/testing.py", "symbol_reports": [ { "kind": "function", "name": "vllm.third_party.triton_kernels.testing.assert_equal", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.third_party.triton_kernels.testing.ComputeSanitizerTool", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ComputeSanitizerTool.MEMCHECK", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ComputeSanitizerTool.RACECHECK", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ComputeSanitizerTool.SYNCCHECK", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ComputeSanitizerTool.INITCHECK", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.testing.compute_sanitizer", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.testing.assert_close", "n_typed": 0, "n_any": 0, "n_untyped": 7, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.testing.compute_actual_scale", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [], "name": "vllm.third_party.triton_kernels.testing", "names": [ "vllm.third_party.triton_kernels.testing.ComputeSanitizerTool", "vllm.third_party.triton_kernels.testing.assert_close", "vllm.third_party.triton_kernels.testing.assert_equal", "vllm.third_party.triton_kernels.testing.compute_actual_scale", "vllm.third_party.triton_kernels.testing.compute_sanitizer" ], "n_typable": 16, "n_typed": 0, "n_any": 0, "n_untyped": 16, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 12, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 1, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/third_party/triton_kernels/topk.py", "symbol_reports": [ { "kind": "function", "name": "vllm.third_party.triton_kernels.topk.make_empty", "n_typed": 0, "n_any": 0, "n_untyped": 6, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.topk.topk_forward", "n_typed": 0, "n_any": 0, "n_untyped": 8, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "class", "name": "vllm.third_party.triton_kernels.topk.TopK", "methods": [ { "kind": "function", "name": "TopK.forward", "n_typed": 0, "n_any": 0, "n_untyped": 9, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "TopK.backward", "n_typed": 0, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [], "n_typable": 14, "n_typed": 0, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 12, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.topk.topk_torch", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.topk.topk_backward", "n_typed": 0, "n_any": 0, "n_untyped": 7, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.third_party.triton_kernels.topk.topk", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "type_ignores": [], "name": "vllm.third_party.triton_kernels.topk", "names": [ "vllm.third_party.triton_kernels.topk.TopK", "vllm.third_party.triton_kernels.topk.make_empty", "vllm.third_party.triton_kernels.topk.topk", "vllm.third_party.triton_kernels.topk.topk_backward", "vllm.third_party.triton_kernels.topk.topk_forward", "vllm.third_party.triton_kernels.topk.topk_torch" ], "n_typable": 50, "n_typed": 12, "n_any": 0, "n_untyped": 38, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 31, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 12, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/tokenizers/registry.py", "symbol_reports": [ { "kind": "function", "name": "vllm.tokenizers.registry.cached_tokenizer_from_config", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.tokenizers.registry.TokenizerRegistry", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.tokenizers.registry.get_tokenizer", "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "attr", "name": "vllm.tokenizers.registry.cached_get_tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.tokenizers.registry.resolve_tokenizer_args", "n_typed": 3, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.tokenizers.registry.tokenizer_args_from_config", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.tokenizers.registry.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.tokenizers.registry.cached_resolve_tokenizer_args", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.tokenizers.registry", "names": [ "vllm.tokenizers.registry.TokenizerRegistry", "vllm.tokenizers.registry.cached_get_tokenizer", "vllm.tokenizers.registry.cached_resolve_tokenizer_args", "vllm.tokenizers.registry.cached_tokenizer_from_config", "vllm.tokenizers.registry.get_tokenizer", "vllm.tokenizers.registry.logger", "vllm.tokenizers.registry.resolve_tokenizer_args", "vllm.tokenizers.registry.tokenizer_args_from_config" ], "n_typable": 24, "n_typed": 11, "n_any": 0, "n_untyped": 13, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 16, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/tokenizers/protocol.py", "symbol_reports": [ { "kind": "class", "name": "vllm.tokenizers.protocol.TokenizerLike", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.tokenizers.protocol", "names": [ "vllm.tokenizers.protocol.TokenizerLike" ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/tokenizers/deepseek_v32.py", "symbol_reports": [ { "kind": "function", "name": "vllm.tokenizers.deepseek_v32.get_deepseek_v32_tokenizer", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.tokenizers.deepseek_v32.DeepseekV32Tokenizer", "methods": [ { "kind": "function", "name": "DeepseekV32Tokenizer.from_pretrained", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.tokenizers.deepseek_v32", "names": [ "vllm.tokenizers.deepseek_v32.DeepseekV32Tokenizer", "vllm.tokenizers.deepseek_v32.get_deepseek_v32_tokenizer" ], "n_typable": 5, "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/tokenizers/deepseek_v32_encoding.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.tokenizers.deepseek_v32_encoding.thinking_start_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.tokenizers.deepseek_v32_encoding.tool_calls_to_openai_format", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.tokenizers.deepseek_v32_encoding.user_msg_template", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.tokenizers.deepseek_v32_encoding.tool_calls_from_openai_format", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.tokenizers.deepseek_v32_encoding.bos_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.tokenizers.deepseek_v32_encoding.assistant_msg_template", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.tokenizers.deepseek_v32_encoding.tool_calls_template", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.tokenizers.deepseek_v32_encoding.eos_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.tokenizers.deepseek_v32_encoding.render_message", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.tokenizers.deepseek_v32_encoding.response_format_template", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.tokenizers.deepseek_v32_encoding.tool_output_template", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.tokenizers.deepseek_v32_encoding.decode_dsml_to_arguments", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.tokenizers.deepseek_v32_encoding.dsml_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.tokenizers.deepseek_v32_encoding.parse_tool_calls", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.tokenizers.deepseek_v32_encoding.thinking_end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.tokenizers.deepseek_v32_encoding.system_msg_template", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.tokenizers.deepseek_v32_encoding.encode_arguments_to_dsml", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.tokenizers.deepseek_v32_encoding.thinking_template", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.tokenizers.deepseek_v32_encoding.find_last_user_index", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.tokenizers.deepseek_v32_encoding.tool_call_template", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.tokenizers.deepseek_v32_encoding.TOOLS_SYSTEM_TEMPLATE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.tokenizers.deepseek_v32_encoding.drop_thinking_messages", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.tokenizers.deepseek_v32_encoding.parse_message_from_completion_text", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.tokenizers.deepseek_v32_encoding.to_json", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.tokenizers.deepseek_v32_encoding.render_tools", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.tokenizers.deepseek_v32_encoding.tools_from_openai_format", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.tokenizers.deepseek_v32_encoding.encode_messages", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "type_ignores": [], "name": "vllm.tokenizers.deepseek_v32_encoding", "names": [ "vllm.tokenizers.deepseek_v32_encoding.TOOLS_SYSTEM_TEMPLATE", "vllm.tokenizers.deepseek_v32_encoding.assistant_msg_template", "vllm.tokenizers.deepseek_v32_encoding.bos_token", "vllm.tokenizers.deepseek_v32_encoding.decode_dsml_to_arguments", "vllm.tokenizers.deepseek_v32_encoding.drop_thinking_messages", "vllm.tokenizers.deepseek_v32_encoding.dsml_token", "vllm.tokenizers.deepseek_v32_encoding.encode_arguments_to_dsml", "vllm.tokenizers.deepseek_v32_encoding.encode_messages", "vllm.tokenizers.deepseek_v32_encoding.eos_token", "vllm.tokenizers.deepseek_v32_encoding.find_last_user_index", "vllm.tokenizers.deepseek_v32_encoding.parse_message_from_completion_text", "vllm.tokenizers.deepseek_v32_encoding.parse_tool_calls", "vllm.tokenizers.deepseek_v32_encoding.render_message", "vllm.tokenizers.deepseek_v32_encoding.render_tools", "vllm.tokenizers.deepseek_v32_encoding.response_format_template", "vllm.tokenizers.deepseek_v32_encoding.system_msg_template", "vllm.tokenizers.deepseek_v32_encoding.thinking_end_token", "vllm.tokenizers.deepseek_v32_encoding.thinking_start_token", "vllm.tokenizers.deepseek_v32_encoding.thinking_template", "vllm.tokenizers.deepseek_v32_encoding.to_json", "vllm.tokenizers.deepseek_v32_encoding.tool_call_template", "vllm.tokenizers.deepseek_v32_encoding.tool_calls_from_openai_format", "vllm.tokenizers.deepseek_v32_encoding.tool_calls_template", "vllm.tokenizers.deepseek_v32_encoding.tool_calls_to_openai_format", "vllm.tokenizers.deepseek_v32_encoding.tool_output_template", "vllm.tokenizers.deepseek_v32_encoding.tools_from_openai_format", "vllm.tokenizers.deepseek_v32_encoding.user_msg_template" ], "n_typable": 47, "n_typed": 38, "n_any": 1, "n_untyped": 8, "n_functions": 13, "n_function_overloads": 13, "n_function_params": 23, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 14, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/tokenizers/detokenizer_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.tokenizers.detokenizer_utils.convert_ids_list_to_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.tokenizers.detokenizer_utils.detokenize_incrementally", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "vllm.tokenizers.detokenizer_utils.convert_prompt_ids_to_tokens", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.tokenizers.detokenizer_utils.INITIAL_INCREMENTAL_DETOKENIZATION_OFFSET", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.tokenizers.detokenizer_utils", "names": [ "vllm.tokenizers.detokenizer_utils.INITIAL_INCREMENTAL_DETOKENIZATION_OFFSET", "vllm.tokenizers.detokenizer_utils.convert_ids_list_to_tokens", "vllm.tokenizers.detokenizer_utils.convert_prompt_ids_to_tokens", "vllm.tokenizers.detokenizer_utils.detokenize_incrementally" ], "n_typable": 15, "n_typed": 15, "n_any": 0, "n_untyped": 0, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 12, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/tokenizers/grok2.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.tokenizers.grok2.PAD", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.tokenizers.grok2.RESERVED_TOKEN_TEXTS", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.tokenizers.grok2.SEP", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.tokenizers.grok2.Grok2Tokenizer", "methods": [ { "kind": "function", "name": "Grok2Tokenizer.from_pretrained", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Grok2Tokenizer.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Grok2Tokenizer.num_special_tokens_to_add", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Grok2Tokenizer.get_vocab", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Grok2Tokenizer.get_added_vocab", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Grok2Tokenizer._maybe_truncate", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Grok2Tokenizer.encode", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Grok2Tokenizer.decode", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Grok2Tokenizer.convert_tokens_to_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 2, "n_params": 1, "n_function_overloads": 2, "n_function_params": 1 }, { "kind": "function", "name": "Grok2Tokenizer.convert_ids_to_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Grok2Tokenizer.convert_tokens_to_string", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Grok2Tokenizer.__call__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Grok2Tokenizer.get_chat_template", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Grok2Tokenizer.apply_chat_template", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [ { "kind": "property", "name": "Grok2Tokenizer.all_special_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Grok2Tokenizer.all_special_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Grok2Tokenizer.bos_token_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Grok2Tokenizer.eos_token_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Grok2Tokenizer.pad_token_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Grok2Tokenizer.is_fast", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Grok2Tokenizer.vocab_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Grok2Tokenizer.max_token_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Grok2Tokenizer.max_chars_per_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Grok2Tokenizer.truncation_side", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "Grok2Tokenizer.name_or_path", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Grok2Tokenizer.init_kwargs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 61, "n_typed": 56, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 15, "n_method_params": 35, "n_attrs": 2, "n_properties": 10 }, { "kind": "attr", "name": "vllm.tokenizers.grok2.DEFAULT_CHAT_TEMPLATE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.tokenizers.grok2.EOS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.tokenizers.grok2.PAT_STR_B", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.tokenizers.grok2.DEFAULT_SPECIAL_TOKENS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.tokenizers.grok2.CONTROL_TOKEN_TEXTS", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.tokenizers.grok2.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.tokenizers.grok2.DEFAULT_CONTROL_TOKENS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.tokenizers.grok2", "names": [ "vllm.tokenizers.grok2.CONTROL_TOKEN_TEXTS", "vllm.tokenizers.grok2.DEFAULT_CHAT_TEMPLATE", "vllm.tokenizers.grok2.DEFAULT_CONTROL_TOKENS", "vllm.tokenizers.grok2.DEFAULT_SPECIAL_TOKENS", "vllm.tokenizers.grok2.EOS", "vllm.tokenizers.grok2.Grok2Tokenizer", "vllm.tokenizers.grok2.PAD", "vllm.tokenizers.grok2.PAT_STR_B", "vllm.tokenizers.grok2.RESERVED_TOKEN_TEXTS", "vllm.tokenizers.grok2.SEP", "vllm.tokenizers.grok2.logger" ], "n_typable": 64, "n_typed": 56, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 15, "n_method_params": 35, "n_classes": 1, "n_attrs": 12, "n_properties": 10, "n_type_ignores": 0 }, { "path": "vllm/tokenizers/hf.py", "symbol_reports": [ { "kind": "class", "name": "vllm.tokenizers.hf.CachedHfTokenizer", "methods": [ { "kind": "function", "name": "CachedHfTokenizer.from_pretrained", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 6, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.tokenizers.hf.get_cached_tokenizer", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.tokenizers.hf.HfTokenizer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.tokenizers.hf", "names": [ "vllm.tokenizers.hf.CachedHfTokenizer", "vllm.tokenizers.hf.HfTokenizer", "vllm.tokenizers.hf.get_cached_tokenizer" ], "n_typable": 10, "n_typed": 8, "n_any": 0, "n_untyped": 2, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 6, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/tokenizers/mistral.py", "symbol_reports": [ { "kind": "function", "name": "vllm.tokenizers.mistral.validate_request_params", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.tokenizers.mistral.MistralTokenizer", "methods": [ { "kind": "function", "name": "MistralTokenizer.from_pretrained", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "MistralTokenizer.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MistralTokenizer._get_special_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MistralTokenizer._get_special_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MistralTokenizer.num_special_tokens_to_add", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MistralTokenizer._is_special_token_id", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MistralTokenizer.__hash__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MistralTokenizer.__len__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MistralTokenizer.__call__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MistralTokenizer.get_vocab", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MistralTokenizer.get_added_vocab", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MistralTokenizer.encode", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MistralTokenizer.apply_chat_template", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MistralTokenizer.decode", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MistralTokenizer.batch_decode", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MistralTokenizer.convert_tokens_to_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 2, "n_params": 1, "n_function_overloads": 2, "n_function_params": 1 }, { "kind": "function", "name": "MistralTokenizer.convert_tokens_to_string", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MistralTokenizer.convert_ids_to_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [ { "kind": "property", "name": "MistralTokenizer.all_special_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "MistralTokenizer.all_special_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "MistralTokenizer.bos_token_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "MistralTokenizer.eos_token_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "MistralTokenizer.pad_token_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "MistralTokenizer.is_fast", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "MistralTokenizer.vocab_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "MistralTokenizer.max_token_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "MistralTokenizer.max_chars_per_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "MistralTokenizer.truncation_side", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "MistralTokenizer.vocab", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "MistralTokenizer.IS_MISTRAL_TOKENIZER", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MistralTokenizer.transformers_tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MistralTokenizer.mistral", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MistralTokenizer.instruct", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MistralTokenizer.tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MistralTokenizer.version", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MistralTokenizer.is_tekken", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MistralTokenizer.is_spm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 65, "n_typed": 56, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 18, "n_method_overloads": 19, "n_method_params": 29, "n_attrs": 8, "n_properties": 11 }, { "kind": "function", "name": "vllm.tokenizers.mistral.maybe_serialize_tool_calls", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.tokenizers.mistral.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.tokenizers.mistral.truncate_tool_call_ids", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.tokenizers.mistral", "names": [ "vllm.tokenizers.mistral.MistralTokenizer", "vllm.tokenizers.mistral.logger", "vllm.tokenizers.mistral.maybe_serialize_tool_calls", "vllm.tokenizers.mistral.truncate_tool_call_ids", "vllm.tokenizers.mistral.validate_request_params" ], "n_typable": 72, "n_typed": 59, "n_any": 0, "n_untyped": 13, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 3, "n_methods": 18, "n_method_overloads": 19, "n_method_params": 29, "n_classes": 1, "n_attrs": 9, "n_properties": 11, "n_type_ignores": 0 }, { "path": "vllm/tokenizers/qwen_vl.py", "symbol_reports": [ { "kind": "class", "name": "vllm.tokenizers.qwen_vl.QwenVLTokenizer", "methods": [ { "kind": "function", "name": "QwenVLTokenizer.from_pretrained", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.tokenizers.qwen_vl.get_qwen_vl_tokenizer", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.tokenizers.qwen_vl", "names": [ "vllm.tokenizers.qwen_vl.QwenVLTokenizer", "vllm.tokenizers.qwen_vl.get_qwen_vl_tokenizer" ], "n_typable": 5, "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/tool_parsers/abstract_tool_parser.py", "symbol_reports": [ { "kind": "class", "name": "vllm.tool_parsers.abstract_tool_parser.ToolParserManager", "methods": [ { "kind": "function", "name": "ToolParserManager.get_tool_parser", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ToolParserManager._load_lazy_parser", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ToolParserManager._register_module", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ToolParserManager.register_lazy_module", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ToolParserManager.register_module", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ToolParserManager.list_registered", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ToolParserManager.import_tool_parser", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ToolParserManager.tool_parsers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ToolParserManager.lazy_parsers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 21, "n_typed": 21, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 12, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.tool_parsers.abstract_tool_parser.ToolParser", "methods": [ { "kind": "function", "name": "ToolParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ToolParser.adjust_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ToolParser.extract_tool_calls", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ToolParser.extract_tool_calls_streaming", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [ { "kind": "property", "name": "ToolParser.vocab", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "ToolParser.prev_tool_call_arr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ToolParser.current_tool_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ToolParser.current_tool_name_sent", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ToolParser.streamed_args_for_tool", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ToolParser.model_tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 19, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 11, "n_attrs": 5, "n_properties": 1 }, { "kind": "attr", "name": "vllm.tool_parsers.abstract_tool_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.tool_parsers.abstract_tool_parser", "names": [ "vllm.tool_parsers.abstract_tool_parser.ToolParser", "vllm.tool_parsers.abstract_tool_parser.ToolParserManager", "vllm.tool_parsers.abstract_tool_parser.logger" ], "n_typable": 43, "n_typed": 40, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 23, "n_classes": 2, "n_attrs": 8, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/tool_parsers/deepseekv31_tool_parser.py", "symbol_reports": [ { "kind": "class", "name": "vllm.tool_parsers.deepseekv31_tool_parser.DeepSeekV31ToolParser", "methods": [ { "kind": "function", "name": "DeepSeekV31ToolParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepSeekV31ToolParser.extract_tool_calls", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeepSeekV31ToolParser.extract_tool_calls_streaming", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DeepSeekV31ToolParser.current_tool_name_sent", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV31ToolParser.prev_tool_call_arr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV31ToolParser.current_tool_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV31ToolParser.streamed_args_for_tool", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV31ToolParser.tool_calls_start_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV31ToolParser.tool_calls_end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV31ToolParser.tool_call_start_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV31ToolParser.tool_call_end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV31ToolParser.tool_call_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV31ToolParser.stream_tool_call_portion_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV31ToolParser.stream_tool_call_name_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV31ToolParser.tool_calls_start_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV31ToolParser.tool_calls_end_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV31ToolParser.tool_call_start_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV31ToolParser.tool_call_end_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 28, "n_typed": 20, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 10, "n_attrs": 15, "n_properties": 0 }, { "kind": "attr", "name": "vllm.tool_parsers.deepseekv31_tool_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.tool_parsers.deepseekv31_tool_parser", "names": [ "vllm.tool_parsers.deepseekv31_tool_parser.DeepSeekV31ToolParser", "vllm.tool_parsers.deepseekv31_tool_parser.logger" ], "n_typable": 29, "n_typed": 20, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 10, "n_classes": 1, "n_attrs": 16, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/tool_parsers/deepseekv32_tool_parser.py", "symbol_reports": [ { "kind": "class", "name": "vllm.tool_parsers.deepseekv32_tool_parser.DeepSeekV32ToolParser", "methods": [ { "kind": "function", "name": "DeepSeekV32ToolParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepSeekV32ToolParser._generate_tool_call_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeepSeekV32ToolParser.adjust_request", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepSeekV32ToolParser._reset_streaming_state", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeepSeekV32ToolParser._parse_invoke_params", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepSeekV32ToolParser.extract_tool_calls", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeepSeekV32ToolParser._extract_name", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepSeekV32ToolParser._extract_param_name", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepSeekV32ToolParser._convert_param_value", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeepSeekV32ToolParser.extract_tool_calls_streaming", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DeepSeekV32ToolParser.prev_tool_call_arr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV32ToolParser.dsml_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV32ToolParser.dsml_start_check", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV32ToolParser.tool_call_start_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV32ToolParser.tool_call_end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV32ToolParser.invoke_start_prefix", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV32ToolParser.invoke_end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV32ToolParser.parameter_prefix", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV32ToolParser.parameter_end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV32ToolParser.current_tool_name_sent", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV32ToolParser.current_tool_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV32ToolParser.streamed_args_for_tool", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV32ToolParser.is_tool_call_started", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV32ToolParser.failed_count", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV32ToolParser.current_tool_index", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV32ToolParser.invoke_index", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV32ToolParser.header_sent", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV32ToolParser.current_function_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV32ToolParser.current_param_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV32ToolParser.current_param_value", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV32ToolParser.param_count", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV32ToolParser.in_param", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV32ToolParser.in_function", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV32ToolParser.json_started", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV32ToolParser.json_closed", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV32ToolParser.accumulated_params", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV32ToolParser.streaming_request", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV32ToolParser.tool_call_complete_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV32ToolParser.invoke_complete_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV32ToolParser.parameter_complete_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 56, "n_typed": 48, "n_any": 1, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 16, "n_attrs": 30, "n_properties": 0 }, { "kind": "attr", "name": "vllm.tool_parsers.deepseekv32_tool_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.tool_parsers.deepseekv32_tool_parser", "names": [ "vllm.tool_parsers.deepseekv32_tool_parser.DeepSeekV32ToolParser", "vllm.tool_parsers.deepseekv32_tool_parser.logger" ], "n_typable": 57, "n_typed": 48, "n_any": 1, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 16, "n_classes": 1, "n_attrs": 31, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/tool_parsers/deepseekv3_tool_parser.py", "symbol_reports": [ { "kind": "class", "name": "vllm.tool_parsers.deepseekv3_tool_parser.DeepSeekV3ToolParser", "methods": [ { "kind": "function", "name": "DeepSeekV3ToolParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepSeekV3ToolParser.extract_tool_calls", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeepSeekV3ToolParser.extract_tool_calls_streaming", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DeepSeekV3ToolParser.current_tool_name_sent", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV3ToolParser.prev_tool_call_arr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV3ToolParser.current_tool_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV3ToolParser.streamed_args_for_tool", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV3ToolParser.tool_calls_start_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV3ToolParser.tool_calls_end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV3ToolParser.tool_call_start_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV3ToolParser.tool_call_end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV3ToolParser.tool_call_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV3ToolParser.stream_tool_call_portion_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV3ToolParser.stream_tool_call_name_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV3ToolParser.tool_calls_start_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV3ToolParser.tool_calls_end_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV3ToolParser.tool_call_start_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepSeekV3ToolParser.tool_call_end_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 28, "n_typed": 20, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 10, "n_attrs": 15, "n_properties": 0 }, { "kind": "attr", "name": "vllm.tool_parsers.deepseekv3_tool_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.tool_parsers.deepseekv3_tool_parser", "names": [ "vllm.tool_parsers.deepseekv3_tool_parser.DeepSeekV3ToolParser", "vllm.tool_parsers.deepseekv3_tool_parser.logger" ], "n_typable": 29, "n_typed": 20, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 10, "n_classes": 1, "n_attrs": 16, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/tool_parsers/ernie45_tool_parser.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.tool_parsers.ernie45_tool_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.tool_parsers.ernie45_tool_parser.Ernie45ToolParser", "methods": [ { "kind": "function", "name": "Ernie45ToolParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Ernie45ToolParser.extract_tool_calls", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Ernie45ToolParser.extract_tool_calls_streaming", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Ernie45ToolParser.current_tool_name_sent", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie45ToolParser.prev_tool_call_arr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Ernie45ToolParser.current_tool_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie45ToolParser.streamed_args_for_tool", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Ernie45ToolParser.think_end_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie45ToolParser.response_start_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Ernie45ToolParser.response_end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Ernie45ToolParser.tool_call_start_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie45ToolParser.tool_call_end_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie45ToolParser.tool_calls_start_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie45ToolParser.newline_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Ernie45ToolParser.tool_call_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie45ToolParser.think_end_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie45ToolParser.response_start_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie45ToolParser.response_end_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie45ToolParser.tool_call_start_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie45ToolParser.tool_call_end_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie45ToolParser.newline_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ernie45ToolParser.parser_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 32, "n_typed": 17, "n_any": 0, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 10, "n_attrs": 19, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.tool_parsers.ernie45_tool_parser", "names": [ "vllm.tool_parsers.ernie45_tool_parser.Ernie45ToolParser", "vllm.tool_parsers.ernie45_tool_parser.logger" ], "n_typable": 33, "n_typed": 17, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 10, "n_classes": 1, "n_attrs": 20, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/tool_parsers/functiongemma_tool_parser.py", "symbol_reports": [ { "kind": "class", "name": "vllm.tool_parsers.functiongemma_tool_parser.FunctionGemmaToolParser", "methods": [ { "kind": "function", "name": "FunctionGemmaToolParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FunctionGemmaToolParser._parse_arguments", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FunctionGemmaToolParser.adjust_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FunctionGemmaToolParser.extract_tool_calls", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FunctionGemmaToolParser._buffer_delta_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FunctionGemmaToolParser.extract_tool_calls_streaming", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FunctionGemmaToolParser.current_tool_name_sent", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FunctionGemmaToolParser.prev_tool_call_arr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FunctionGemmaToolParser.current_tool_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FunctionGemmaToolParser.streamed_args_for_tool", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FunctionGemmaToolParser.tool_call_start_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FunctionGemmaToolParser.tool_call_end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FunctionGemmaToolParser.tool_call_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunctionGemmaToolParser.arg_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunctionGemmaToolParser.buffered_delta_text", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunctionGemmaToolParser.tool_call_start_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunctionGemmaToolParser.tool_call_end_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 30, "n_typed": 24, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 13, "n_attrs": 11, "n_properties": 0 }, { "kind": "attr", "name": "vllm.tool_parsers.functiongemma_tool_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.tool_parsers.functiongemma_tool_parser", "names": [ "vllm.tool_parsers.functiongemma_tool_parser.FunctionGemmaToolParser", "vllm.tool_parsers.functiongemma_tool_parser.logger" ], "n_typable": 31, "n_typed": 24, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 13, "n_classes": 1, "n_attrs": 12, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/tool_parsers/gigachat3_tool_parser.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.tool_parsers.gigachat3_tool_parser.REGEX_FUNCTION_CALL", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.tool_parsers.gigachat3_tool_parser.ARGS_REGEX", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.tool_parsers.gigachat3_tool_parser.GigaChat3ToolParser", "methods": [ { "kind": "function", "name": "GigaChat3ToolParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GigaChat3ToolParser.extract_tool_calls", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GigaChat3ToolParser.extract_tool_calls_streaming", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GigaChat3ToolParser.tool_started", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GigaChat3ToolParser.tool_name_sent", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GigaChat3ToolParser.tool_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GigaChat3ToolParser.prev_tool_call_arr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GigaChat3ToolParser.content_buffer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GigaChat3ToolParser.trigger_start", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 17, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 10, "n_attrs": 6, "n_properties": 0 }, { "kind": "attr", "name": "vllm.tool_parsers.gigachat3_tool_parser.NAME_REGEX", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.tool_parsers.gigachat3_tool_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.tool_parsers.gigachat3_tool_parser", "names": [ "vllm.tool_parsers.gigachat3_tool_parser.ARGS_REGEX", "vllm.tool_parsers.gigachat3_tool_parser.GigaChat3ToolParser", "vllm.tool_parsers.gigachat3_tool_parser.NAME_REGEX", "vllm.tool_parsers.gigachat3_tool_parser.REGEX_FUNCTION_CALL", "vllm.tool_parsers.gigachat3_tool_parser.logger" ], "n_typable": 23, "n_typed": 17, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 10, "n_classes": 1, "n_attrs": 10, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/tool_parsers/glm47_moe_tool_parser.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.tool_parsers.glm47_moe_tool_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.tool_parsers.glm47_moe_tool_parser.Glm47MoeModelToolParser", "methods": [ { "kind": "function", "name": "Glm47MoeModelToolParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Glm47MoeModelToolParser.func_detail_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm47MoeModelToolParser.func_arg_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 4, "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.tool_parsers.glm47_moe_tool_parser", "names": [ "vllm.tool_parsers.glm47_moe_tool_parser.Glm47MoeModelToolParser", "vllm.tool_parsers.glm47_moe_tool_parser.logger" ], "n_typable": 5, "n_typed": 1, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_classes": 1, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/tool_parsers/glm4_moe_tool_parser.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.tool_parsers.glm4_moe_tool_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.tool_parsers.glm4_moe_tool_parser.Glm4MoeModelToolParser", "methods": [ { "kind": "function", "name": "Glm4MoeModelToolParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4MoeModelToolParser._deserialize", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4MoeModelToolParser._json_escape_string_content", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4MoeModelToolParser._is_string_type", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Glm4MoeModelToolParser._tools_enabled", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4MoeModelToolParser.adjust_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4MoeModelToolParser.extract_tool_calls", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Glm4MoeModelToolParser.extract_tool_calls_streaming", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "Glm4MoeModelToolParser._ensure_tool_state", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Glm4MoeModelToolParser._begin_tool_call", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Glm4MoeModelToolParser._finish_tool_call", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Glm4MoeModelToolParser._revert_last_tool_call_state", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Glm4MoeModelToolParser._emit_tool_name_delta", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4MoeModelToolParser._emit_tool_args_delta", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Glm4MoeModelToolParser._append_arg_fragment", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Glm4MoeModelToolParser._close_args_if_needed", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Glm4MoeModelToolParser.current_tool_name_sent", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeModelToolParser.prev_tool_call_arr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeModelToolParser.current_tool_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeModelToolParser.streamed_args_for_tool", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeModelToolParser.tool_call_start_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeModelToolParser.tool_call_end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeModelToolParser.arg_key_start", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeModelToolParser.arg_key_end", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeModelToolParser.arg_val_start", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeModelToolParser.arg_val_end", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeModelToolParser.tool_calls_start_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeModelToolParser.func_call_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeModelToolParser.func_detail_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeModelToolParser.func_arg_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeModelToolParser.tool_call_start_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Glm4MoeModelToolParser.tool_call_end_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 53, "n_typed": 45, "n_any": 1, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 16, "n_method_overloads": 16, "n_method_params": 21, "n_attrs": 16, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.tool_parsers.glm4_moe_tool_parser", "names": [ "vllm.tool_parsers.glm4_moe_tool_parser.Glm4MoeModelToolParser", "vllm.tool_parsers.glm4_moe_tool_parser.logger" ], "n_typable": 54, "n_typed": 45, "n_any": 1, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 16, "n_method_overloads": 16, "n_method_params": 21, "n_classes": 1, "n_attrs": 17, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/tool_parsers/granite_20b_fc_tool_parser.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.tool_parsers.granite_20b_fc_tool_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.tool_parsers.granite_20b_fc_tool_parser.Granite20bFCToolParser", "methods": [ { "kind": "function", "name": "Granite20bFCToolParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Granite20bFCToolParser.extract_tool_calls", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Granite20bFCToolParser.extract_tool_calls_streaming", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Granite20bFCToolParser.bot_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Granite20bFCToolParser.tool_start_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Granite20bFCToolParser.tool_call_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 12, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 10, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.tool_parsers.granite_20b_fc_tool_parser", "names": [ "vllm.tool_parsers.granite_20b_fc_tool_parser.Granite20bFCToolParser", "vllm.tool_parsers.granite_20b_fc_tool_parser.logger" ], "n_typable": 17, "n_typed": 12, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 10, "n_classes": 1, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/tool_parsers/granite_tool_parser.py", "symbol_reports": [ { "kind": "class", "name": "vllm.tool_parsers.granite_tool_parser.GraniteToolParser", "methods": [ { "kind": "function", "name": "GraniteToolParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GraniteToolParser.extract_tool_calls", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GraniteToolParser.extract_tool_calls_streaming", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GraniteToolParser.bot_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GraniteToolParser.bot_string", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 12, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 10, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.tool_parsers.granite_tool_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.tool_parsers.granite_tool_parser", "names": [ "vllm.tool_parsers.granite_tool_parser.GraniteToolParser", "vllm.tool_parsers.granite_tool_parser.logger" ], "n_typable": 16, "n_typed": 12, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 10, "n_classes": 1, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/tool_parsers/hermes_tool_parser.py", "symbol_reports": [ { "kind": "class", "name": "vllm.tool_parsers.hermes_tool_parser.Hermes2ProToolParser", "methods": [ { "kind": "function", "name": "Hermes2ProToolParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Hermes2ProToolParser.tool_call_delta_buffer", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Hermes2ProToolParser.adjust_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Hermes2ProToolParser.extract_tool_calls", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Hermes2ProToolParser.extract_tool_calls_streaming", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Hermes2ProToolParser.current_tool_name_sent", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Hermes2ProToolParser.prev_tool_call_arr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Hermes2ProToolParser.current_tool_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Hermes2ProToolParser.streamed_args_for_tool", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Hermes2ProToolParser.tool_call_start_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Hermes2ProToolParser.tool_call_end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Hermes2ProToolParser.tool_call_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Hermes2ProToolParser.scratch_pad_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Hermes2ProToolParser.tool_call_start_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Hermes2ProToolParser.tool_call_end_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Hermes2ProToolParser.tool_call_start_token_array", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Hermes2ProToolParser.tool_call_end_token_array", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Hermes2ProToolParser.buffered_delta_text", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Hermes2ProToolParser.model_tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 31, "n_typed": 21, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 12, "n_attrs": 14, "n_properties": 0 }, { "kind": "attr", "name": "vllm.tool_parsers.hermes_tool_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.tool_parsers.hermes_tool_parser", "names": [ "vllm.tool_parsers.hermes_tool_parser.Hermes2ProToolParser", "vllm.tool_parsers.hermes_tool_parser.logger" ], "n_typable": 32, "n_typed": 21, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 12, "n_classes": 1, "n_attrs": 15, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/tool_parsers/hunyuan_a13b_tool_parser.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.tool_parsers.hunyuan_a13b_tool_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.tool_parsers.hunyuan_a13b_tool_parser.HunyuanA13BToolParser", "methods": [ { "kind": "function", "name": "HunyuanA13BToolParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HunyuanA13BToolParser.preprocess_model_output", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HunyuanA13BToolParser.extract_tool_calls", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "HunyuanA13BToolParser.extract_tool_calls_streaming", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "HunyuanA13BToolParser._try_parse_json_tools", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HunyuanA13BToolParser._handle_test_compatibility", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HunyuanA13BToolParser._ensure_state_arrays", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "HunyuanA13BToolParser._handle_tool_name_streaming", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "HunyuanA13BToolParser._handle_tool_args_streaming", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "HunyuanA13BToolParser.prev_tool_calls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "HunyuanA13BToolParser.current_tool_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunyuanA13BToolParser.current_tool_name_sent", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunyuanA13BToolParser.streamed_args", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "HunyuanA13BToolParser.current_tools_sent", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "HunyuanA13BToolParser.prev_tool_call_arr", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunyuanA13BToolParser.answer_tool_calls_pattern", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunyuanA13BToolParser.tool_name_reg", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunyuanA13BToolParser.tool_empty_arg_reg", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunyuanA13BToolParser.tool_non_empty_arg_reg", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunyuanA13BToolParser.bot_string", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunyuanA13BToolParser.streaming_state", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 41, "n_typed": 26, "n_any": 0, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 20, "n_attrs": 12, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.tool_parsers.hunyuan_a13b_tool_parser", "names": [ "vllm.tool_parsers.hunyuan_a13b_tool_parser.HunyuanA13BToolParser", "vllm.tool_parsers.hunyuan_a13b_tool_parser.logger" ], "n_typable": 42, "n_typed": 26, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 20, "n_classes": 1, "n_attrs": 13, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/tool_parsers/internlm2_tool_parser.py", "symbol_reports": [ { "kind": "class", "name": "vllm.tool_parsers.internlm2_tool_parser.Internlm2ToolParser", "methods": [ { "kind": "function", "name": "Internlm2ToolParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Internlm2ToolParser.adjust_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Internlm2ToolParser.get_arguments", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Internlm2ToolParser.extract_tool_calls_streaming", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "Internlm2ToolParser.extract_tool_calls", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Internlm2ToolParser.position", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 14, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 12, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.tool_parsers.internlm2_tool_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.tool_parsers.internlm2_tool_parser", "names": [ "vllm.tool_parsers.internlm2_tool_parser.Internlm2ToolParser", "vllm.tool_parsers.internlm2_tool_parser.logger" ], "n_typable": 19, "n_typed": 14, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 12, "n_classes": 1, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/tool_parsers/jamba_tool_parser.py", "symbol_reports": [ { "kind": "class", "name": "vllm.tool_parsers.jamba_tool_parser.JambaToolParser", "methods": [ { "kind": "function", "name": "JambaToolParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "JambaToolParser.adjust_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "JambaToolParser.extract_tool_calls", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "JambaToolParser.extract_tool_calls_streaming", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "JambaToolParser.current_tool_name_sent", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "JambaToolParser.prev_tool_call_arr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "JambaToolParser.current_tool_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "JambaToolParser.streamed_args_for_tool", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "JambaToolParser.tool_calls_start_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "JambaToolParser.tool_calls_end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "JambaToolParser.tool_calls_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JambaToolParser.tool_calls_start_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JambaToolParser.tool_calls_end_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 24, "n_typed": 20, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 11, "n_attrs": 9, "n_properties": 0 }, { "kind": "attr", "name": "vllm.tool_parsers.jamba_tool_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.tool_parsers.jamba_tool_parser", "names": [ "vllm.tool_parsers.jamba_tool_parser.JambaToolParser", "vllm.tool_parsers.jamba_tool_parser.logger" ], "n_typable": 25, "n_typed": 20, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 11, "n_classes": 1, "n_attrs": 10, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/tool_parsers/kimi_k2_tool_parser.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.tool_parsers.kimi_k2_tool_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.tool_parsers.kimi_k2_tool_parser.KimiK2ToolParser", "methods": [ { "kind": "function", "name": "KimiK2ToolParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KimiK2ToolParser._check_and_strip_markers", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KimiK2ToolParser._reset_section_state", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KimiK2ToolParser.reset_streaming_state", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KimiK2ToolParser.extract_tool_calls", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "KimiK2ToolParser.extract_tool_calls_streaming", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "KimiK2ToolParser.current_tool_name_sent", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KimiK2ToolParser.prev_tool_call_arr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KimiK2ToolParser.current_tool_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KimiK2ToolParser.streamed_args_for_tool", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KimiK2ToolParser.in_tool_section", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KimiK2ToolParser.token_buffer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KimiK2ToolParser.buffer_max_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KimiK2ToolParser.section_char_count", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KimiK2ToolParser.max_section_chars", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KimiK2ToolParser.tool_calls_start_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KimiK2ToolParser.tool_calls_end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KimiK2ToolParser.tool_calls_start_token_variants", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KimiK2ToolParser.tool_calls_end_token_variants", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KimiK2ToolParser.tool_call_start_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KimiK2ToolParser.tool_call_end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KimiK2ToolParser.tool_call_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK2ToolParser.stream_tool_call_portion_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK2ToolParser.stream_tool_call_name_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK2ToolParser.tool_calls_start_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK2ToolParser.tool_calls_end_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK2ToolParser.tool_calls_start_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KimiK2ToolParser.tool_calls_end_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KimiK2ToolParser.tool_call_start_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK2ToolParser.tool_call_end_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 41, "n_typed": 33, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 11, "n_attrs": 24, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.tool_parsers.kimi_k2_tool_parser", "names": [ "vllm.tool_parsers.kimi_k2_tool_parser.KimiK2ToolParser", "vllm.tool_parsers.kimi_k2_tool_parser.logger" ], "n_typable": 42, "n_typed": 33, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 11, "n_classes": 1, "n_attrs": 25, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/tool_parsers/llama4_pythonic_tool_parser.py", "symbol_reports": [ { "kind": "class", "name": "vllm.tool_parsers.llama4_pythonic_tool_parser.Llama4PythonicToolParser", "methods": [ { "kind": "function", "name": "Llama4PythonicToolParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Llama4PythonicToolParser.extract_tool_calls", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Llama4PythonicToolParser.extract_tool_calls_streaming", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [ { "kind": "property", "name": "Llama4PythonicToolParser.current_tool_index", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_typable": 2 } ], "attrs": [ { "kind": "attr", "name": "Llama4PythonicToolParser.TOOL_CALL_REGEX", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 14, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 10, "n_attrs": 1, "n_properties": 1 }, { "kind": "attr", "name": "vllm.tool_parsers.llama4_pythonic_tool_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.tool_parsers.llama4_pythonic_tool_parser", "names": [ "vllm.tool_parsers.llama4_pythonic_tool_parser.Llama4PythonicToolParser", "vllm.tool_parsers.llama4_pythonic_tool_parser.logger" ], "n_typable": 17, "n_typed": 14, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 10, "n_classes": 1, "n_attrs": 2, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/tool_parsers/llama_tool_parser.py", "symbol_reports": [ { "kind": "class", "name": "vllm.tool_parsers.llama_tool_parser.Llama3JsonToolParser", "methods": [ { "kind": "function", "name": "Llama3JsonToolParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Llama3JsonToolParser.extract_tool_calls", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Llama3JsonToolParser.extract_tool_calls_streaming", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Llama3JsonToolParser.prev_tool_call_arr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Llama3JsonToolParser.current_tool_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Llama3JsonToolParser.current_tool_name_sent", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Llama3JsonToolParser.streamed_args_for_tool", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Llama3JsonToolParser.bot_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama3JsonToolParser.bot_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama3JsonToolParser.tool_call_start_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Llama3JsonToolParser.json_decoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 16, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 10, "n_attrs": 8, "n_properties": 0 }, { "kind": "attr", "name": "vllm.tool_parsers.llama_tool_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.tool_parsers.llama_tool_parser", "names": [ "vllm.tool_parsers.llama_tool_parser.Llama3JsonToolParser", "vllm.tool_parsers.llama_tool_parser.logger" ], "n_typable": 22, "n_typed": 16, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 10, "n_classes": 1, "n_attrs": 9, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/tool_parsers/longcat_tool_parser.py", "symbol_reports": [ { "kind": "class", "name": "vllm.tool_parsers.longcat_tool_parser.LongcatFlashToolParser", "methods": [ { "kind": "function", "name": "LongcatFlashToolParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LongcatFlashToolParser.tool_call_start_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LongcatFlashToolParser.tool_call_end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LongcatFlashToolParser.tool_call_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LongcatFlashToolParser.tool_call_start_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LongcatFlashToolParser.tool_call_end_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LongcatFlashToolParser.tool_call_start_token_array", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LongcatFlashToolParser.tool_call_end_token_array", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 3, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 7, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.tool_parsers.longcat_tool_parser", "names": [ "vllm.tool_parsers.longcat_tool_parser.LongcatFlashToolParser" ], "n_typable": 9, "n_typed": 3, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_classes": 1, "n_attrs": 7, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/tool_parsers/minimax_m2_tool_parser.py", "symbol_reports": [ { "kind": "class", "name": "vllm.tool_parsers.minimax_m2_tool_parser.MinimaxM2ToolParser", "methods": [ { "kind": "function", "name": "MinimaxM2ToolParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MinimaxM2ToolParser._generate_tool_call_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MinimaxM2ToolParser._reset_streaming_state", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MinimaxM2ToolParser._extract_name", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MinimaxM2ToolParser._convert_param_value", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MinimaxM2ToolParser._extract_types_from_schema", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MinimaxM2ToolParser._convert_param_value_with_types", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MinimaxM2ToolParser._get_param_types_from_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MinimaxM2ToolParser._parse_single_invoke", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MinimaxM2ToolParser.extract_tool_calls", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MinimaxM2ToolParser.extract_tool_calls_streaming", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MinimaxM2ToolParser.prev_tool_call_arr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MinimaxM2ToolParser.tool_call_start_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MinimaxM2ToolParser.tool_call_end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MinimaxM2ToolParser.invoke_start_prefix", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MinimaxM2ToolParser.invoke_end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MinimaxM2ToolParser.parameter_prefix", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MinimaxM2ToolParser.parameter_end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MinimaxM2ToolParser.current_tool_name_sent", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MinimaxM2ToolParser.current_tool_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MinimaxM2ToolParser.streamed_args_for_tool", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MinimaxM2ToolParser.is_tool_call_started", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MinimaxM2ToolParser.failed_count", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MinimaxM2ToolParser.current_tool_index", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MinimaxM2ToolParser.invoke_index", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MinimaxM2ToolParser.header_sent", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MinimaxM2ToolParser.current_function_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MinimaxM2ToolParser.current_param_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MinimaxM2ToolParser.current_param_value", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MinimaxM2ToolParser.param_count", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MinimaxM2ToolParser.in_param", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MinimaxM2ToolParser.in_function", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MinimaxM2ToolParser.accumulated_text", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MinimaxM2ToolParser.json_started", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MinimaxM2ToolParser.json_closed", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MinimaxM2ToolParser.accumulated_params", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MinimaxM2ToolParser.streaming_request", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MinimaxM2ToolParser.tool_call_complete_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MinimaxM2ToolParser.invoke_complete_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MinimaxM2ToolParser.parameter_complete_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MinimaxM2ToolParser.tool_call_start_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MinimaxM2ToolParser.tool_call_end_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 62, "n_typed": 52, "n_any": 3, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 20, "n_attrs": 31, "n_properties": 0 }, { "kind": "attr", "name": "vllm.tool_parsers.minimax_m2_tool_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.tool_parsers.minimax_m2_tool_parser", "names": [ "vllm.tool_parsers.minimax_m2_tool_parser.MinimaxM2ToolParser", "vllm.tool_parsers.minimax_m2_tool_parser.logger" ], "n_typable": 63, "n_typed": 52, "n_any": 3, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 20, "n_classes": 1, "n_attrs": 32, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/tool_parsers/minimax_tool_parser.py", "symbol_reports": [ { "kind": "class", "name": "vllm.tool_parsers.minimax_tool_parser.MinimaxToolParser", "methods": [ { "kind": "function", "name": "MinimaxToolParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MinimaxToolParser.preprocess_model_output", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MinimaxToolParser._clean_duplicate_braces", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MinimaxToolParser._clean_delta_braces", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MinimaxToolParser.extract_tool_calls", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MinimaxToolParser._update_thinking_state", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MinimaxToolParser._is_potential_tag_start", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MinimaxToolParser._should_buffer_content", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MinimaxToolParser._split_content_for_buffering", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MinimaxToolParser._process_buffer", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MinimaxToolParser._reset_streaming_state", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MinimaxToolParser._advance_to_next_tool", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MinimaxToolParser._set_current_tool_index", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MinimaxToolParser._get_current_tool_index", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MinimaxToolParser._get_next_unsent_tool_index", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MinimaxToolParser._ensure_state_arrays", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MinimaxToolParser._detect_tools_in_text", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MinimaxToolParser._find_tool_boundaries", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MinimaxToolParser._extract_tool_args", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MinimaxToolParser._get_current_tool_content", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MinimaxToolParser._handle_tool_name_streaming", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MinimaxToolParser._handle_tool_args_streaming", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MinimaxToolParser._is_end_tool_calls", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MinimaxToolParser.extract_tool_calls_streaming", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "MinimaxToolParser._find_tool_start_outside_thinking", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MinimaxToolParser._extract_content_before_tools", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MinimaxToolParser._extract_tool_content", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MinimaxToolParser.streaming_state", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MinimaxToolParser.tool_call_start_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MinimaxToolParser.tool_call_end_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MinimaxToolParser.tool_call_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MinimaxToolParser.thinking_tag_pattern", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MinimaxToolParser.tool_name_pattern", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MinimaxToolParser.tool_args_pattern", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MinimaxToolParser.pending_buffer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MinimaxToolParser.in_thinking_tag", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MinimaxToolParser.tool_call_start_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MinimaxToolParser.tool_call_end_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 76, "n_typed": 65, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 27, "n_method_overloads": 27, "n_method_params": 38, "n_attrs": 11, "n_properties": 0 }, { "kind": "attr", "name": "vllm.tool_parsers.minimax_tool_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.tool_parsers.minimax_tool_parser", "names": [ "vllm.tool_parsers.minimax_tool_parser.MinimaxToolParser", "vllm.tool_parsers.minimax_tool_parser.logger" ], "n_typable": 77, "n_typed": 65, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 27, "n_method_overloads": 27, "n_method_params": 38, "n_classes": 1, "n_attrs": 12, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/tool_parsers/mistral_tool_parser.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.tool_parsers.mistral_tool_parser.ALPHANUMERIC", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.tool_parsers.mistral_tool_parser.StreamingState", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "StreamingState.WAITING_FOR_TOOL_START", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StreamingState.WAITING_FOR_TOOL_KEY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StreamingState.PARSING_NAME", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StreamingState.PARSING_NAME_COMPLETED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StreamingState.WAITING_FOR_ARGUMENTS_START", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StreamingState.PARSING_ARGUMENTS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StreamingState.PARSING_ARGUMENTS_COMPLETED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StreamingState.TOOL_COMPLETE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StreamingState.ALL_TOOLS_COMPLETE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.tool_parsers.mistral_tool_parser.MistralToolParser", "methods": [ { "kind": "function", "name": "MistralToolParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MistralToolParser.adjust_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MistralToolParser.extract_tool_calls", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MistralToolParser.extract_tool_calls_streaming", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "MistralToolParser._extract_tool_calls_streaming", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MistralToolParser._generate_delta_tool_call", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MistralToolParser.update_stream_state_pre_v11_tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MistralToolParser._extract_tool_calls_streaming_pre_v11_tokenizer", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MistralToolParser._split_delta", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MistralToolParser.prev_tool_call_arr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MistralToolParser.current_tool_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MistralToolParser.streaming_state", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MistralToolParser.current_tool_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MistralToolParser.current_tool_mistral_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MistralToolParser.starting_new_tool", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MistralToolParser.bot_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MistralToolParser.bot_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MistralToolParser.tool_call_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MistralToolParser.parse_coro", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 42, "n_typed": 34, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 23, "n_attrs": 10, "n_properties": 0 }, { "kind": "attr", "name": "vllm.tool_parsers.mistral_tool_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.tool_parsers.mistral_tool_parser.MistralToolCall", "methods": [ { "kind": "function", "name": "MistralToolCall.generate_random_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MistralToolCall.is_valid_id", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MistralToolCall.id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 4, "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.tool_parsers.mistral_tool_parser", "names": [ "vllm.tool_parsers.mistral_tool_parser.ALPHANUMERIC", "vllm.tool_parsers.mistral_tool_parser.MistralToolCall", "vllm.tool_parsers.mistral_tool_parser.MistralToolParser", "vllm.tool_parsers.mistral_tool_parser.StreamingState", "vllm.tool_parsers.mistral_tool_parser.logger" ], "n_typable": 47, "n_typed": 37, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 24, "n_classes": 3, "n_attrs": 22, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/tool_parsers/olmo3_tool_parser.py", "symbol_reports": [ { "kind": "class", "name": "vllm.tool_parsers.olmo3_tool_parser.Olmo3PythonicToolParser", "methods": [ { "kind": "function", "name": "Olmo3PythonicToolParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Olmo3PythonicToolParser.extract_tool_calls", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Olmo3PythonicToolParser.extract_tool_calls_streaming", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [ { "kind": "property", "name": "Olmo3PythonicToolParser.current_tool_index", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_typable": 2 } ], "attrs": [ { "kind": "attr", "name": "Olmo3PythonicToolParser.TOOL_CALL_REGEX", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 14, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 10, "n_attrs": 1, "n_properties": 1 }, { "kind": "attr", "name": "vllm.tool_parsers.olmo3_tool_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.tool_parsers.olmo3_tool_parser", "names": [ "vllm.tool_parsers.olmo3_tool_parser.Olmo3PythonicToolParser", "vllm.tool_parsers.olmo3_tool_parser.logger" ], "n_typable": 17, "n_typed": 14, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 10, "n_classes": 1, "n_attrs": 2, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/tool_parsers/openai_tool_parser.py", "symbol_reports": [ { "kind": "class", "name": "vllm.tool_parsers.openai_tool_parser.OpenAIToolParser", "methods": [ { "kind": "function", "name": "OpenAIToolParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OpenAIToolParser.extract_tool_calls", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "OpenAIToolParser.extract_tool_calls_streaming", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [], "n_typable": 14, "n_typed": 13, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 11, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.tool_parsers.openai_tool_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.tool_parsers.openai_tool_parser.TokenizerLike", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.tool_parsers.openai_tool_parser", "names": [ "vllm.tool_parsers.openai_tool_parser.OpenAIToolParser", "vllm.tool_parsers.openai_tool_parser.TokenizerLike", "vllm.tool_parsers.openai_tool_parser.logger" ], "n_typable": 15, "n_typed": 13, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 11, "n_classes": 1, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/tool_parsers/phi4mini_tool_parser.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.tool_parsers.phi4mini_tool_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.tool_parsers.phi4mini_tool_parser.Phi4MiniJsonToolParser", "methods": [ { "kind": "function", "name": "Phi4MiniJsonToolParser.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Phi4MiniJsonToolParser.extract_tool_calls", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Phi4MiniJsonToolParser.extract_tool_calls_streaming", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Phi4MiniJsonToolParser.prev_tool_call_arr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Phi4MiniJsonToolParser.current_tool_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Phi4MiniJsonToolParser.current_tool_name_sent", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Phi4MiniJsonToolParser.streamed_args_for_tool", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Phi4MiniJsonToolParser.bot_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 18, "n_typed": 18, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 10, "n_attrs": 5, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.tool_parsers.phi4mini_tool_parser", "names": [ "vllm.tool_parsers.phi4mini_tool_parser.Phi4MiniJsonToolParser", "vllm.tool_parsers.phi4mini_tool_parser.logger" ], "n_typable": 19, "n_typed": 18, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 10, "n_classes": 1, "n_attrs": 6, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/tool_parsers/pythonic_tool_parser.py", "symbol_reports": [ { "kind": "class", "name": "vllm.tool_parsers.pythonic_tool_parser.PythonicToolParser", "methods": [ { "kind": "function", "name": "PythonicToolParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PythonicToolParser.extract_tool_calls", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PythonicToolParser.extract_tool_calls_streaming", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [ { "kind": "property", "name": "PythonicToolParser.current_tool_index", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_typable": 2 } ], "attrs": [ { "kind": "attr", "name": "PythonicToolParser.TOOL_CALL_REGEX", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 14, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 10, "n_attrs": 1, "n_properties": 1 }, { "kind": "attr", "name": "vllm.tool_parsers.pythonic_tool_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.tool_parsers.pythonic_tool_parser", "names": [ "vllm.tool_parsers.pythonic_tool_parser.PythonicToolParser", "vllm.tool_parsers.pythonic_tool_parser.logger" ], "n_typable": 17, "n_typed": 14, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 10, "n_classes": 1, "n_attrs": 2, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/tool_parsers/qwen3coder_tool_parser.py", "symbol_reports": [ { "kind": "class", "name": "vllm.tool_parsers.qwen3coder_tool_parser.Qwen3CoderToolParser", "methods": [ { "kind": "function", "name": "Qwen3CoderToolParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3CoderToolParser._generate_tool_call_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Qwen3CoderToolParser._reset_streaming_state", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Qwen3CoderToolParser._get_arguments_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3CoderToolParser._convert_param_value", "n_typed": 4, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Qwen3CoderToolParser._parse_xml_function_call", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3CoderToolParser._get_function_calls", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3CoderToolParser.extract_tool_calls", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3CoderToolParser.extract_tool_calls_streaming", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3CoderToolParser.current_tool_name_sent", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3CoderToolParser.prev_tool_call_arr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3CoderToolParser.current_tool_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3CoderToolParser.streamed_args_for_tool", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3CoderToolParser.tool_call_start_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3CoderToolParser.tool_call_end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3CoderToolParser.tool_call_prefix", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3CoderToolParser.function_end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3CoderToolParser.parameter_prefix", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3CoderToolParser.parameter_end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3CoderToolParser.is_tool_call_started", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3CoderToolParser.failed_count", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3CoderToolParser.tool_call_complete_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3CoderToolParser.tool_call_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3CoderToolParser.tool_call_function_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3CoderToolParser.tool_call_parameter_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3CoderToolParser.tool_call_start_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3CoderToolParser.tool_call_end_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 46, "n_typed": 37, "n_any": 1, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 19, "n_attrs": 18, "n_properties": 0 }, { "kind": "attr", "name": "vllm.tool_parsers.qwen3coder_tool_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.tool_parsers.qwen3coder_tool_parser", "names": [ "vllm.tool_parsers.qwen3coder_tool_parser.Qwen3CoderToolParser", "vllm.tool_parsers.qwen3coder_tool_parser.logger" ], "n_typable": 47, "n_typed": 37, "n_any": 1, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 19, "n_classes": 1, "n_attrs": 19, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/tool_parsers/qwen3xml_tool_parser.py", "symbol_reports": [ { "kind": "class", "name": "vllm.tool_parsers.qwen3xml_tool_parser.Qwen3XMLToolParser", "methods": [ { "kind": "function", "name": "Qwen3XMLToolParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Qwen3XMLToolParser.extract_tool_calls", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3XMLToolParser.extract_tool_calls_streaming", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3XMLToolParser.parser", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3XMLToolParser.prev_tool_call_arr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3XMLToolParser.streamed_args_for_tool", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 16, "n_typed": 14, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 10, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.tool_parsers.qwen3xml_tool_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.tool_parsers.qwen3xml_tool_parser.StreamingXMLToolCallParser", "methods": [ { "kind": "function", "name": "StreamingXMLToolCallParser.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "StreamingXMLToolCallParser.reset_streaming_state", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "StreamingXMLToolCallParser.parse_single_streaming_chunks", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StreamingXMLToolCallParser._escape_xml_special_chars", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StreamingXMLToolCallParser._process_complete_xml_elements", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "StreamingXMLToolCallParser._should_skip_element", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StreamingXMLToolCallParser._find_next_complete_element", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StreamingXMLToolCallParser._merge_new_deltas_to_single_response", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StreamingXMLToolCallParser._preprocess_xml_chunk", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StreamingXMLToolCallParser._emit_delta", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StreamingXMLToolCallParser._auto_close_open_parameter_if_needed", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StreamingXMLToolCallParser._start_element", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StreamingXMLToolCallParser._char_data", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StreamingXMLToolCallParser._end_element", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StreamingXMLToolCallParser.setup_parser", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "StreamingXMLToolCallParser.set_tools", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StreamingXMLToolCallParser._extract_function_name", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StreamingXMLToolCallParser._extract_parameter_name", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StreamingXMLToolCallParser._get_param_type", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StreamingXMLToolCallParser.repair_param_type", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StreamingXMLToolCallParser._convert_param_value", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StreamingXMLToolCallParser._convert_for_json_streaming", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StreamingXMLToolCallParser._reset_xml_parser_after_tool_call", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "StreamingXMLToolCallParser.tools", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "StreamingXMLToolCallParser.tool_call_start_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "StreamingXMLToolCallParser.tool_call_end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "StreamingXMLToolCallParser.function_start_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "StreamingXMLToolCallParser.function_end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "StreamingXMLToolCallParser.parameter_start_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "StreamingXMLToolCallParser.parameter_end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 53, "n_typed": 41, "n_any": 2, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 23, "n_method_overloads": 23, "n_method_params": 23, "n_attrs": 7, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.tool_parsers.qwen3xml_tool_parser", "names": [ "vllm.tool_parsers.qwen3xml_tool_parser.Qwen3XMLToolParser", "vllm.tool_parsers.qwen3xml_tool_parser.StreamingXMLToolCallParser", "vllm.tool_parsers.qwen3xml_tool_parser.logger" ], "n_typable": 70, "n_typed": 55, "n_any": 2, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 26, "n_method_overloads": 26, "n_method_params": 33, "n_classes": 2, "n_attrs": 11, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/tool_parsers/seed_oss_tool_parser.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.tool_parsers.seed_oss_tool_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.tool_parsers.seed_oss_tool_parser.SeedOssToolParser", "methods": [ { "kind": "function", "name": "SeedOssToolParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SeedOssToolParser._generate_tool_call_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SeedOssToolParser._reset_streaming_state", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SeedOssToolParser._parse_xml_function_call", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SeedOssToolParser._get_function_calls", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SeedOssToolParser.extract_tool_calls", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SeedOssToolParser.extract_tool_calls_streaming", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SeedOssToolParser.TOOL_CALL_START", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SeedOssToolParser.TOOL_CALL_END", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SeedOssToolParser.prev_tool_call_arr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssToolParser.tool_call_start_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssToolParser.tool_call_end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssToolParser.tool_call_prefix", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssToolParser.function_end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssToolParser.parameter_prefix", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssToolParser.parameter_end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssToolParser.think_start_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssToolParser.think_end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssToolParser.is_tool_call_started", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssToolParser.is_thinking_end", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssToolParser.failed_count", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssToolParser.tool_call_start_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssToolParser.tool_call_end_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssToolParser.think_end_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssToolParser.tool_call_complete_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssToolParser.tool_call_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssToolParser.tool_call_function_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SeedOssToolParser.tool_call_parameter_regex", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 39, "n_typed": 30, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 13, "n_attrs": 21, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.tool_parsers.seed_oss_tool_parser", "names": [ "vllm.tool_parsers.seed_oss_tool_parser.SeedOssToolParser", "vllm.tool_parsers.seed_oss_tool_parser.logger" ], "n_typable": 40, "n_typed": 30, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 13, "n_classes": 1, "n_attrs": 22, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/tool_parsers/step3_tool_parser.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.tool_parsers.step3_tool_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.tool_parsers.step3_tool_parser.Step3ToolParser", "methods": [ { "kind": "function", "name": "Step3ToolParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Step3ToolParser.adjust_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Step3ToolParser._parse_steptml_invoke", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Step3ToolParser._cast_arguments", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Step3ToolParser.extract_tool_calls_streaming", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "Step3ToolParser.extract_tool_calls", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Step3ToolParser.TOOL_CALLS_BEGIN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Step3ToolParser.TOOL_CALLS_END", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Step3ToolParser.TOOL_CALL_BEGIN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Step3ToolParser.TOOL_CALL_END", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Step3ToolParser.TOOL_SEP", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Step3ToolParser.SPECIAL_TOKENS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Step3ToolParser.position", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3ToolParser.tool_block_started", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3ToolParser.tool_block_finished", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 24, "n_typed": 20, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 15, "n_attrs": 9, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.tool_parsers.step3_tool_parser", "names": [ "vllm.tool_parsers.step3_tool_parser.Step3ToolParser", "vllm.tool_parsers.step3_tool_parser.logger" ], "n_typable": 25, "n_typed": 20, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 15, "n_classes": 1, "n_attrs": 10, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/tool_parsers/step3p5_tool_parser.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.tool_parsers.step3p5_tool_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.tool_parsers.step3p5_tool_parser.Step3p5ToolParser", "methods": [ { "kind": "function", "name": "Step3p5ToolParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Step3p5ToolParser.extract_tool_calls", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Step3p5ToolParser.extract_tool_calls_streaming", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "Step3p5ToolParser.parser_should_check_for_unstreamed_tool_arg_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Step3p5ToolParser.parser", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5ToolParser.prev_tool_call_arr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5ToolParser.streamed_args_for_tool", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 17, "n_typed": 15, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 10, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.tool_parsers.step3p5_tool_parser.StreamingXMLToolCallParser", "methods": [ { "kind": "function", "name": "StreamingXMLToolCallParser.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "StreamingXMLToolCallParser.reset_streaming_state", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "StreamingXMLToolCallParser.parse_single_streaming_chunks", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StreamingXMLToolCallParser._escape_xml_special_chars", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StreamingXMLToolCallParser._process_complete_xml_elements", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "StreamingXMLToolCallParser._fix_incomplete_tag_in_chunk", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StreamingXMLToolCallParser._fix_missing_equals_in_function_tag", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StreamingXMLToolCallParser._validate_function_name", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StreamingXMLToolCallParser._validate_parameter_name", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StreamingXMLToolCallParser._should_skip_element", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StreamingXMLToolCallParser._find_next_complete_element", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StreamingXMLToolCallParser._merge_new_deltas_to_single_response", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StreamingXMLToolCallParser._preprocess_xml_chunk", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StreamingXMLToolCallParser._emit_delta", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StreamingXMLToolCallParser._auto_close_open_parameter_if_needed", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StreamingXMLToolCallParser._start_element", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StreamingXMLToolCallParser._char_data", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StreamingXMLToolCallParser._end_element", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StreamingXMLToolCallParser.setup_parser", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "StreamingXMLToolCallParser.set_tools", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StreamingXMLToolCallParser._extract_function_name", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StreamingXMLToolCallParser._extract_parameter_name", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StreamingXMLToolCallParser._get_param_type", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StreamingXMLToolCallParser.repair_param_type", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StreamingXMLToolCallParser._convert_param_value", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StreamingXMLToolCallParser._convert_for_json_streaming", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StreamingXMLToolCallParser._reset_xml_parser_after_tool_call", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "StreamingXMLToolCallParser.tools", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "StreamingXMLToolCallParser.tool_call_start_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "StreamingXMLToolCallParser.tool_call_end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "StreamingXMLToolCallParser.function_start_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "StreamingXMLToolCallParser.function_end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "StreamingXMLToolCallParser.parameter_start_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "StreamingXMLToolCallParser.parameter_end_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 61, "n_typed": 49, "n_any": 2, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 27, "n_method_overloads": 27, "n_method_params": 27, "n_attrs": 7, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.tool_parsers.step3p5_tool_parser", "names": [ "vllm.tool_parsers.step3p5_tool_parser.Step3p5ToolParser", "vllm.tool_parsers.step3p5_tool_parser.StreamingXMLToolCallParser", "vllm.tool_parsers.step3p5_tool_parser.logger" ], "n_typable": 79, "n_typed": 64, "n_any": 2, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 31, "n_method_overloads": 31, "n_method_params": 37, "n_classes": 2, "n_attrs": 11, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/tool_parsers/utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.tool_parsers.utils.find_common_suffix", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.tool_parsers.utils.is_complete_json", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.tool_parsers.utils.consume_space", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.tool_parsers.utils.find_common_prefix", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.tool_parsers.utils.extract_intermediate_diff", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.tool_parsers.utils.get_json_schema_from_tools", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.tool_parsers.utils.partial_json_loads", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.tool_parsers.utils", "names": [ "vllm.tool_parsers.utils.consume_space", "vllm.tool_parsers.utils.extract_intermediate_diff", "vllm.tool_parsers.utils.find_common_prefix", "vllm.tool_parsers.utils.find_common_suffix", "vllm.tool_parsers.utils.get_json_schema_from_tools", "vllm.tool_parsers.utils.is_complete_json", "vllm.tool_parsers.utils.partial_json_loads" ], "n_typable": 20, "n_typed": 20, "n_any": 0, "n_untyped": 0, "n_functions": 7, "n_function_overloads": 7, "n_function_params": 13, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/tool_parsers/xlam_tool_parser.py", "symbol_reports": [ { "kind": "class", "name": "vllm.tool_parsers.xlam_tool_parser.xLAMToolParser", "methods": [ { "kind": "function", "name": "xLAMToolParser.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "xLAMToolParser.preprocess_model_output", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "xLAMToolParser.extract_tool_calls", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "xLAMToolParser.extract_tool_calls_streaming", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "xLAMToolParser.prev_tool_calls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "xLAMToolParser.current_tool_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "xLAMToolParser.current_tool_name_sent", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "xLAMToolParser.streamed_args", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "xLAMToolParser.current_tools_sent", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "xLAMToolParser.prev_tool_call_arr", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "xLAMToolParser.json_code_block_patterns", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "xLAMToolParser.thinking_tag_pattern", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "xLAMToolParser.streaming_state", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 24, "n_typed": 18, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 11, "n_attrs": 9, "n_properties": 0 }, { "kind": "attr", "name": "vllm.tool_parsers.xlam_tool_parser.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.tool_parsers.xlam_tool_parser", "names": [ "vllm.tool_parsers.xlam_tool_parser.logger", "vllm.tool_parsers.xlam_tool_parser.xLAMToolParser" ], "n_typable": 25, "n_typed": 18, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 11, "n_classes": 1, "n_attrs": 10, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/tracing/__init__.py", "symbol_reports": [ { "kind": "function", "name": "vllm.tracing.init_tracer", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.tracing.SpanKind", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.tracing.is_tracing_available", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.tracing.instrument_manual", "n_typed": 4, "n_any": 2, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.tracing.instrument", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.tracing.maybe_init_worker_tracer", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [], "name": "vllm.tracing", "names": [ "vllm.tracing.SpanKind", "vllm.tracing.init_tracer", "vllm.tracing.instrument", "vllm.tracing.instrument_manual", "vllm.tracing.is_tracing_available", "vllm.tracing.maybe_init_worker_tracer" ], "n_typable": 21, "n_typed": 15, "n_any": 2, "n_untyped": 4, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 16, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/tracing/utils.py", "symbol_reports": [ { "kind": "class", "name": "vllm.tracing.utils.SpanAttributes", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "SpanAttributes.GEN_AI_USAGE_COMPLETION_TOKENS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SpanAttributes.GEN_AI_USAGE_PROMPT_TOKENS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SpanAttributes.GEN_AI_REQUEST_MAX_TOKENS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SpanAttributes.GEN_AI_REQUEST_TOP_P", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SpanAttributes.GEN_AI_REQUEST_TEMPERATURE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SpanAttributes.GEN_AI_RESPONSE_MODEL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SpanAttributes.GEN_AI_REQUEST_ID", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SpanAttributes.GEN_AI_REQUEST_N", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SpanAttributes.GEN_AI_USAGE_NUM_SEQUENCES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SpanAttributes.GEN_AI_LATENCY_TIME_IN_QUEUE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SpanAttributes.GEN_AI_LATENCY_TIME_TO_FIRST_TOKEN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SpanAttributes.GEN_AI_LATENCY_E2E", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SpanAttributes.GEN_AI_LATENCY_TIME_IN_SCHEDULER", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SpanAttributes.GEN_AI_LATENCY_TIME_IN_MODEL_FORWARD", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SpanAttributes.GEN_AI_LATENCY_TIME_IN_MODEL_EXECUTE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SpanAttributes.GEN_AI_LATENCY_TIME_IN_MODEL_PREFILL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SpanAttributes.GEN_AI_LATENCY_TIME_IN_MODEL_DECODE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SpanAttributes.GEN_AI_LATENCY_TIME_IN_MODEL_INFERENCE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 18, "n_properties": 0 }, { "kind": "function", "name": "vllm.tracing.utils.contains_trace_headers", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.tracing.utils.log_tracing_disabled_warning", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.tracing.utils.extract_trace_headers", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.tracing.utils.LoadingSpanAttributes", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "LoadingSpanAttributes.CODE_NAMESPACE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LoadingSpanAttributes.CODE_FUNCTION", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LoadingSpanAttributes.CODE_FILEPATH", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LoadingSpanAttributes.CODE_LINENO", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "attr", "name": "vllm.tracing.utils.TRACE_HEADERS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.tracing.utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.tracing.utils", "names": [ "vllm.tracing.utils.LoadingSpanAttributes", "vllm.tracing.utils.SpanAttributes", "vllm.tracing.utils.TRACE_HEADERS", "vllm.tracing.utils.contains_trace_headers", "vllm.tracing.utils.extract_trace_headers", "vllm.tracing.utils.log_tracing_disabled_warning", "vllm.tracing.utils.logger" ], "n_typable": 6, "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 2, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 2, "n_attrs": 24, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/tracing/otel.py", "symbol_reports": [ { "kind": "function", "name": "vllm.tracing.otel.extract_trace_context", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.tracing.otel.otel_import_error_traceback", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.tracing.otel.get_span_exporter", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.tracing.otel.instrument_otel", "n_typed": 0, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.tracing.otel.init_otel_worker_tracer", "n_typed": 3, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.tracing.otel.init_otel_tracer", "n_typed": 3, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.tracing.otel.propagate_trace_to_env", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.tracing.otel.inject", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.tracing.otel.Resource", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.tracing.otel.manual_instrument_otel", "n_typed": 5, "n_any": 1, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.tracing.otel.is_otel_available", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.tracing.otel.trace", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.tracing.otel.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [ { "kind": "type", "rules": null }, { "kind": "type", "rules": null }, { "kind": "type", "rules": null }, { "kind": "type", "rules": null }, { "kind": "type", "rules": null }, { "kind": "type", "rules": null } ], "name": "vllm.tracing.otel", "names": [ "vllm.tracing.otel.Resource", "vllm.tracing.otel.extract_trace_context", "vllm.tracing.otel.get_span_exporter", "vllm.tracing.otel.init_otel_tracer", "vllm.tracing.otel.init_otel_worker_tracer", "vllm.tracing.otel.inject", "vllm.tracing.otel.instrument_otel", "vllm.tracing.otel.is_otel_available", "vllm.tracing.otel.logger", "vllm.tracing.otel.manual_instrument_otel", "vllm.tracing.otel.otel_import_error_traceback", "vllm.tracing.otel.propagate_trace_to_env", "vllm.tracing.otel.trace" ], "n_typable": 27, "n_typed": 14, "n_any": 3, "n_untyped": 10, "n_functions": 8, "n_function_overloads": 8, "n_function_params": 18, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 5, "n_properties": 0, "n_type_ignores": 6 }, { "path": "vllm/transformers_utils/chat_templates/registry.py", "symbol_reports": [ { "kind": "function", "name": "vllm.transformers_utils.chat_templates.registry.get_chat_template_fallback_path", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.transformers_utils.chat_templates.registry.register_chat_template_fallback_path", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.transformers_utils.chat_templates.registry.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.chat_templates.registry.ChatTemplatePath", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.transformers_utils.chat_templates.registry", "names": [ "vllm.transformers_utils.chat_templates.registry.ChatTemplatePath", "vllm.transformers_utils.chat_templates.registry.get_chat_template_fallback_path", "vllm.transformers_utils.chat_templates.registry.logger", "vllm.transformers_utils.chat_templates.registry.register_chat_template_fallback_path" ], "n_typable": 8, "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 4, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/config.py", "symbol_reports": [ { "kind": "function", "name": "vllm.transformers_utils.config.get_config", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "vllm.transformers_utils.config.is_rope_parameters_nested", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.transformers_utils.config.is_encoder_decoder", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.transformers_utils.config.uses_mrope", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.transformers_utils.config.try_get_safetensors_metadata", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.transformers_utils.config.is_interleaved", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.config.ConfigFormat", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.config.MISTRAL_CONFIG_NAME", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.transformers_utils.config.patch_rope_parameters", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.transformers_utils.config.get_safetensors_params_metadata", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.transformers_utils.config.get_hf_text_config", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.transformers_utils.config.get_sentence_transformer_tokenizer_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.transformers_utils.config.try_get_tokenizer_config", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.transformers_utils.config.parse_pooling_type", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.transformers_utils.config.try_get_generation_config", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.transformers_utils.config.set_default_rope_theta", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.transformers_utils.config.HFConfigParser", "methods": [ { "kind": "function", "name": "HFConfigParser.parse", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.config.LazyConfigDict", "methods": [ { "kind": "function", "name": "LazyConfigDict.__getitem__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.transformers_utils.config.uses_xdrope_dim", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.transformers_utils.config.get_pooling_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.transformers_utils.config.maybe_register_config_serialize_by_value", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "class", "name": "vllm.transformers_utils.config.MistralConfigParser", "methods": [ { "kind": "function", "name": "MistralConfigParser.parse", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.transformers_utils.config.register_config_parser", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.transformers_utils.config.get_hf_image_processor_config", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.transformers_utils.config.thinker_uses_mrope", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.transformers_utils.config.try_get_dense_modules", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.transformers_utils.config.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.transformers_utils.config.patch_rope_parameters_dict", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.transformers_utils.config.maybe_override_with_speculators", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.transformers_utils.config.get_config_parser", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.transformers_utils.config", "names": [ "vllm.transformers_utils.config.ConfigFormat", "vllm.transformers_utils.config.HFConfigParser", "vllm.transformers_utils.config.LazyConfigDict", "vllm.transformers_utils.config.MISTRAL_CONFIG_NAME", "vllm.transformers_utils.config.MistralConfigParser", "vllm.transformers_utils.config.get_config", "vllm.transformers_utils.config.get_config_parser", "vllm.transformers_utils.config.get_hf_image_processor_config", "vllm.transformers_utils.config.get_hf_text_config", "vllm.transformers_utils.config.get_pooling_config", "vllm.transformers_utils.config.get_safetensors_params_metadata", "vllm.transformers_utils.config.get_sentence_transformer_tokenizer_config", "vllm.transformers_utils.config.is_encoder_decoder", "vllm.transformers_utils.config.is_interleaved", "vllm.transformers_utils.config.is_rope_parameters_nested", "vllm.transformers_utils.config.logger", "vllm.transformers_utils.config.maybe_override_with_speculators", "vllm.transformers_utils.config.maybe_register_config_serialize_by_value", "vllm.transformers_utils.config.parse_pooling_type", "vllm.transformers_utils.config.patch_rope_parameters", "vllm.transformers_utils.config.patch_rope_parameters_dict", "vllm.transformers_utils.config.register_config_parser", "vllm.transformers_utils.config.set_default_rope_theta", "vllm.transformers_utils.config.thinker_uses_mrope", "vllm.transformers_utils.config.try_get_dense_modules", "vllm.transformers_utils.config.try_get_generation_config", "vllm.transformers_utils.config.try_get_safetensors_metadata", "vllm.transformers_utils.config.try_get_tokenizer_config", "vllm.transformers_utils.config.uses_mrope", "vllm.transformers_utils.config.uses_xdrope_dim" ], "n_typable": 89, "n_typed": 77, "n_any": 0, "n_untyped": 12, "n_functions": 24, "n_function_overloads": 24, "n_function_params": 49, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 11, "n_classes": 3, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/config_parser_base.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.config_parser_base.ConfigParserBase", "methods": [ { "kind": "function", "name": "ConfigParserBase.parse", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.transformers_utils.config_parser_base", "names": [ "vllm.transformers_utils.config_parser_base.ConfigParserBase" ], "n_typable": 6, "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 5, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/AXK1.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.configs.AXK1.AXK1Config", "methods": [ { "kind": "function", "name": "AXK1Config.__init__", "n_typed": 42, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 44, "n_params": 43, "n_function_overloads": 1, "n_function_params": 43 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AXK1Config.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AXK1Config.keys_to_ignore_at_inference", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AXK1Config.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Config.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Config.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Config.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Config.moe_intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Config.num_hidden_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Config.num_nextn_predict_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Config.num_attention_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Config.n_shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Config.n_routed_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Config.ep_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Config.routed_scaling_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Config.kv_lora_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Config.q_lora_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Config.qk_rope_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Config.v_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Config.qk_nope_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Config.topk_method", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Config.n_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Config.topk_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Config.num_experts_per_tok", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Config.moe_layer_freq", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Config.first_k_dense_replace", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Config.norm_topk_prob", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Config.scoring_func", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Config.aux_loss_alpha", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Config.seq_aux", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Config.num_key_value_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Config.hidden_act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Config.initializer_range", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Config.rms_norm_eps", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Config.pretraining_tp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Config.use_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Config.rope_theta", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Config.rope_scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Config.rope_parameters", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Config.attention_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AXK1Config.attention_dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 82, "n_typed": 42, "n_any": 0, "n_untyped": 40, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 43, "n_attrs": 40, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.AXK1", "names": [ "vllm.transformers_utils.configs.AXK1.AXK1Config" ], "n_typable": 82, "n_typed": 42, "n_any": 0, "n_untyped": 40, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 43, "n_classes": 1, "n_attrs": 40, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/__init__.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.transformers_utils.configs.JAISConfig", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.BagelConfig", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.DeepseekV3Config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.FunAudioChatConfig", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.Olmo3Config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.ColQwen3Config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.AXK1Config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.MLPSpeculatorConfig", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.SpeculatorsConfig", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.HunYuanVLVisionConfig", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.EAGLEConfig", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.IsaacConfig", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.PixelShuffleSiglip2VisionConfig", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.ChatGLMConfig", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.RWConfig", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.Step3VLConfig", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.Tarsier2Config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.Qwen3_5Config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.ColModernVBertConfig", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.HunYuanVLTextConfig", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.Qwen3VLNemotronEmbedConfig", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.DeepseekVLV2Config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.KimiVLConfig", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.AfmoeConfig", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.Qwen3_5TextConfig", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.NemotronConfig", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.FunAudioChatAudioEncoderConfig", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.UltravoxConfig", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.Step3VisionEncoderConfig", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.Qwen3NextConfig", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.OpsColQwen3Config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.Lfm2MoeConfig", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.NemotronHConfig", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.RadioConfig", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.MoonViTConfig", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.KimiLinearConfig", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.Qwen3_5MoeConfig", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.MedusaConfig", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.MiDashengLMConfig", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.Step3p5Config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.Qwen3_5MoeTextConfig", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.KimiK25Config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.Qwen3ASRConfig", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.HunYuanVLConfig", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.OvisConfig", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.FlexOlmoConfig", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.DotsOCRConfig", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.Step3TextConfig", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs", "names": [ "vllm.transformers_utils.configs.AXK1Config", "vllm.transformers_utils.configs.AfmoeConfig", "vllm.transformers_utils.configs.BagelConfig", "vllm.transformers_utils.configs.ChatGLMConfig", "vllm.transformers_utils.configs.ColModernVBertConfig", "vllm.transformers_utils.configs.ColQwen3Config", "vllm.transformers_utils.configs.DeepseekV3Config", "vllm.transformers_utils.configs.DeepseekVLV2Config", "vllm.transformers_utils.configs.DotsOCRConfig", "vllm.transformers_utils.configs.EAGLEConfig", "vllm.transformers_utils.configs.FlexOlmoConfig", "vllm.transformers_utils.configs.FunAudioChatAudioEncoderConfig", "vllm.transformers_utils.configs.FunAudioChatConfig", "vllm.transformers_utils.configs.HunYuanVLConfig", "vllm.transformers_utils.configs.HunYuanVLTextConfig", "vllm.transformers_utils.configs.HunYuanVLVisionConfig", "vllm.transformers_utils.configs.IsaacConfig", "vllm.transformers_utils.configs.JAISConfig", "vllm.transformers_utils.configs.KimiK25Config", "vllm.transformers_utils.configs.KimiLinearConfig", "vllm.transformers_utils.configs.KimiVLConfig", "vllm.transformers_utils.configs.Lfm2MoeConfig", "vllm.transformers_utils.configs.MLPSpeculatorConfig", "vllm.transformers_utils.configs.MedusaConfig", "vllm.transformers_utils.configs.MiDashengLMConfig", "vllm.transformers_utils.configs.MoonViTConfig", "vllm.transformers_utils.configs.NemotronConfig", "vllm.transformers_utils.configs.NemotronHConfig", "vllm.transformers_utils.configs.Olmo3Config", "vllm.transformers_utils.configs.OpsColQwen3Config", "vllm.transformers_utils.configs.OvisConfig", "vllm.transformers_utils.configs.PixelShuffleSiglip2VisionConfig", "vllm.transformers_utils.configs.Qwen3ASRConfig", "vllm.transformers_utils.configs.Qwen3NextConfig", "vllm.transformers_utils.configs.Qwen3VLNemotronEmbedConfig", "vllm.transformers_utils.configs.Qwen3_5Config", "vllm.transformers_utils.configs.Qwen3_5MoeConfig", "vllm.transformers_utils.configs.Qwen3_5MoeTextConfig", "vllm.transformers_utils.configs.Qwen3_5TextConfig", "vllm.transformers_utils.configs.RWConfig", "vllm.transformers_utils.configs.RadioConfig", "vllm.transformers_utils.configs.SpeculatorsConfig", "vllm.transformers_utils.configs.Step3TextConfig", "vllm.transformers_utils.configs.Step3VLConfig", "vllm.transformers_utils.configs.Step3VisionEncoderConfig", "vllm.transformers_utils.configs.Step3p5Config", "vllm.transformers_utils.configs.Tarsier2Config", "vllm.transformers_utils.configs.UltravoxConfig" ], "n_typable": 48, "n_typed": 0, "n_any": 0, "n_untyped": 48, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 48, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/afmoe.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.configs.afmoe.AfmoeConfig", "methods": [ { "kind": "function", "name": "AfmoeConfig.__init__", "n_typed": 32, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 34, "n_params": 33, "n_function_overloads": 1, "n_function_params": 33 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AfmoeConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AfmoeConfig.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeConfig.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeConfig.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeConfig.num_hidden_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeConfig.num_dense_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeConfig.num_attention_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeConfig.num_key_value_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeConfig.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeConfig.hidden_act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeConfig.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeConfig.initializer_range", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeConfig.rms_norm_eps", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeConfig.use_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeConfig.rope_parameters", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeConfig.rope_scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeConfig.moe_intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeConfig.num_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeConfig.num_experts_per_tok", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeConfig.num_shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeConfig.num_expert_groups", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeConfig.num_limited_groups", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeConfig.score_func", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeConfig.route_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeConfig.route_scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeConfig.global_attn_every_n_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeConfig.sliding_window", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeConfig.layer_types", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeConfig.attention_dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeConfig.mup_enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeConfig.n_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AfmoeConfig.topk_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 65, "n_typed": 32, "n_any": 0, "n_untyped": 33, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 33, "n_attrs": 32, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.afmoe", "names": [ "vllm.transformers_utils.configs.afmoe.AfmoeConfig" ], "n_typable": 65, "n_typed": 32, "n_any": 0, "n_untyped": 33, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 33, "n_classes": 1, "n_attrs": 32, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/arctic.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.configs.arctic.ArcticQuantizationConfig", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ArcticQuantizationConfig.q_bits", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ArcticQuantizationConfig.rounding", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ArcticQuantizationConfig.mantissa_bits", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ArcticQuantizationConfig.group_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.arctic.ARCTIC_PRETRAINED_CONFIG_ARCHIVE_MAP", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.transformers_utils.configs.arctic.ArcticConfig", "methods": [ { "kind": "function", "name": "ArcticConfig.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 30, "n_overloads": 1, "n_typable": 31, "n_params": 30, "n_function_overloads": 1, "n_function_params": 30 }, { "kind": "function", "name": "ArcticConfig.from_dict", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ArcticConfig.to_dict", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ArcticConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ArcticConfig.keys_to_ignore_at_inference", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ArcticConfig.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticConfig.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticConfig.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticConfig.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticConfig.num_hidden_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticConfig.num_attention_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticConfig.sliding_window", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticConfig.num_key_value_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticConfig.hidden_act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticConfig.initializer_range", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticConfig.rms_norm_eps", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticConfig.use_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticConfig.rope_parameters", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticConfig.attention_dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticConfig.num_experts_per_tok", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticConfig.num_local_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticConfig.router_aux_loss_coef", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticConfig.moe_layer_frequency", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticConfig.moe_train_capacity_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticConfig.moe_eval_capacity_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticConfig.enable_expert_tensor_parallelism", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticConfig.moe_min_capacity", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticConfig.moe_token_dropping", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticConfig.parallel_attn_mlp_res", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ArcticConfig.quantization", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 60, "n_typed": 4, "n_any": 0, "n_untyped": 56, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 32, "n_attrs": 27, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.configs.arctic.ArcticLoRAConfig", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ArcticLoRAConfig.lora_r", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ArcticLoRAConfig.lora_alpha", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ArcticLoRAConfig.shard_base_weights", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.arctic.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.arctic", "names": [ "vllm.transformers_utils.configs.arctic.ARCTIC_PRETRAINED_CONFIG_ARCHIVE_MAP", "vllm.transformers_utils.configs.arctic.ArcticConfig", "vllm.transformers_utils.configs.arctic.ArcticLoRAConfig", "vllm.transformers_utils.configs.arctic.ArcticQuantizationConfig", "vllm.transformers_utils.configs.arctic.logger" ], "n_typable": 61, "n_typed": 4, "n_any": 0, "n_untyped": 57, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 32, "n_classes": 3, "n_attrs": 36, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/bagel.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.configs.bagel.BagelConfig", "methods": [ { "kind": "function", "name": "BagelConfig.__init__", "n_typed": 11, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 } ], "properties": [ { "kind": "property", "name": "BagelConfig.hidden_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "BagelConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BagelConfig.visual_gen", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BagelConfig.visual_und", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BagelConfig.vae_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BagelConfig.latent_patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BagelConfig.max_latent_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BagelConfig.vit_max_num_patch_per_side", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BagelConfig.connector_act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BagelConfig.interpolate_pos", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BagelConfig.timestep_shift", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BagelConfig.llm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BagelConfig.vit_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 25, "n_typed": 12, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 12, "n_attrs": 12, "n_properties": 1 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.bagel", "names": [ "vllm.transformers_utils.configs.bagel.BagelConfig" ], "n_typable": 25, "n_typed": 12, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 12, "n_classes": 1, "n_attrs": 12, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/chatglm.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.configs.chatglm.ChatGLMConfig", "methods": [ { "kind": "function", "name": "ChatGLMConfig.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 27, "n_overloads": 1, "n_typable": 27, "n_params": 26, "n_function_overloads": 1, "n_function_params": 26 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ChatGLMConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ChatGLMConfig.attribute_map", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ChatGLMConfig.num_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMConfig.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMConfig.padded_vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMConfig.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMConfig.ffn_hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMConfig.kv_channels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMConfig.num_attention_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMConfig.seq_length", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMConfig.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMConfig.hidden_dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMConfig.attention_dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMConfig.layernorm_epsilon", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMConfig.rmsnorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMConfig.apply_residual_connection_post_layernorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMConfig.post_layer_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMConfig.add_bias_linear", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMConfig.add_qkv_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMConfig.bias_dropout_fusion", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMConfig.multi_query_attention", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMConfig.multi_query_group_num", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMConfig.apply_query_key_layer_scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMConfig.attention_softmax_in_fp32", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMConfig.fp32_residual_connection", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMConfig.quantization_bit", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMConfig.pre_seq_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMConfig.prefix_projection", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ChatGLMConfig.interleaved_qkv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 54, "n_typed": 0, "n_any": 0, "n_untyped": 54, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 26, "n_attrs": 29, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.chatglm", "names": [ "vllm.transformers_utils.configs.chatglm.ChatGLMConfig" ], "n_typable": 54, "n_typed": 0, "n_any": 0, "n_untyped": 54, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 26, "n_classes": 1, "n_attrs": 29, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/colmodernvbert.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.configs.colmodernvbert.ColModernVBertConfig", "methods": [ { "kind": "function", "name": "ColModernVBertConfig.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ColModernVBertConfig.get_text_config", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "ColModernVBertConfig.image_seq_len", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "ColModernVBertConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ColModernVBertConfig.embedding_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ColModernVBertConfig.image_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ColModernVBertConfig.pixel_shuffle_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ColModernVBertConfig.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ColModernVBertConfig.text_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ColModernVBertConfig.vision_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 3, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 7, "n_properties": 1 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.colmodernvbert", "names": [ "vllm.transformers_utils.configs.colmodernvbert.ColModernVBertConfig" ], "n_typable": 13, "n_typed": 3, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_classes": 1, "n_attrs": 7, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/colqwen3.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.configs.colqwen3.OpsColQwen3Config", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "OpsColQwen3Config.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.configs.colqwen3.Qwen3VLNemotronEmbedConfig", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3VLNemotronEmbedConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.configs.colqwen3.ColQwen3Config", "methods": [ { "kind": "function", "name": "ColQwen3Config.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ColQwen3Config.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ColQwen3Config.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ColQwen3Config.dims", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ColQwen3Config.dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ColQwen3Config.projection_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ColQwen3Config.colbert_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ColQwen3Config.pooling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 6, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 7, "n_attrs": 7, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.colqwen3", "names": [ "vllm.transformers_utils.configs.colqwen3.ColQwen3Config", "vllm.transformers_utils.configs.colqwen3.OpsColQwen3Config", "vllm.transformers_utils.configs.colqwen3.Qwen3VLNemotronEmbedConfig" ], "n_typable": 14, "n_typed": 6, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 7, "n_classes": 3, "n_attrs": 9, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/deepseek_vl2.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.configs.deepseek_vl2.MlpProjectorConfig", "methods": [ { "kind": "function", "name": "MlpProjectorConfig.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MlpProjectorConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MlpProjectorConfig.projector_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MlpProjectorConfig.input_dim", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MlpProjectorConfig.n_embed", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MlpProjectorConfig.depth", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MlpProjectorConfig.mlp_ratio", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MlpProjectorConfig.downsample_ratio", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MlpProjectorConfig.token_pooling", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 15, "n_typed": 13, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 7, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.configs.deepseek_vl2.DeepseekVLV2Config", "methods": [ { "kind": "function", "name": "DeepseekVLV2Config.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DeepseekVLV2Config.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekVLV2Config.architectures", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekVLV2Config.vision_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekVLV2Config.projector_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekVLV2Config.tile_tag", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekVLV2Config.global_view_pos", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekVLV2Config.candidate_resolutions", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekVLV2Config.text_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekVLV2Config.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 9, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 4, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.configs.deepseek_vl2.VisionEncoderConfig", "methods": [ { "kind": "function", "name": "VisionEncoderConfig.__init__", "n_typed": 12, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "VisionEncoderConfig.model_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VisionEncoderConfig.model_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VisionEncoderConfig.image_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VisionEncoderConfig.patch_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VisionEncoderConfig.width", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VisionEncoderConfig.layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VisionEncoderConfig.heads", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VisionEncoderConfig.mlp_ratio", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VisionEncoderConfig.global_pool", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VisionEncoderConfig.ignore_head", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VisionEncoderConfig.class_token", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VisionEncoderConfig.num_classes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VisionEncoderConfig.use_checkpoint", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VisionEncoderConfig.weight_init", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VisionEncoderConfig.deterministic", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "VisionEncoderConfig.num_recomputing_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 30, "n_typed": 28, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 13, "n_attrs": 16, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.deepseek_vl2", "names": [ "vllm.transformers_utils.configs.deepseek_vl2.DeepseekVLV2Config", "vllm.transformers_utils.configs.deepseek_vl2.MlpProjectorConfig", "vllm.transformers_utils.configs.deepseek_vl2.VisionEncoderConfig" ], "n_typable": 59, "n_typed": 50, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 24, "n_classes": 3, "n_attrs": 33, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/dotsocr.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.configs.dotsocr.DotsOCRConfig", "methods": [ { "kind": "function", "name": "DotsOCRConfig.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "DotsOCRConfig.save_pretrained", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DotsOCRConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DotsOCRConfig.image_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsOCRConfig.video_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsOCRConfig.vision_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 1, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.configs.dotsocr.DotsVisionConfig", "methods": [ { "kind": "function", "name": "DotsVisionConfig.__init__", "n_typed": 11, "n_any": 1, "n_untyped": 7, "n_overloads": 1, "n_typable": 19, "n_params": 18, "n_function_overloads": 1, "n_function_params": 18 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DotsVisionConfig.model_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DotsVisionConfig.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsVisionConfig.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsVisionConfig.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsVisionConfig.num_hidden_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsVisionConfig.num_attention_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsVisionConfig.num_channels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsVisionConfig.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsVisionConfig.spatial_merge_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsVisionConfig.temporal_patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsVisionConfig.rms_norm_eps", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsVisionConfig.use_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsVisionConfig.attn_implementation", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsVisionConfig.initializer_range", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsVisionConfig.init_merger_std", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsVisionConfig.is_causal", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsVisionConfig.post_norm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DotsVisionConfig.gradient_checkpointing", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 37, "n_typed": 12, "n_any": 1, "n_untyped": 24, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 18, "n_attrs": 18, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.dotsocr", "names": [ "vllm.transformers_utils.configs.dotsocr.DotsOCRConfig", "vllm.transformers_utils.configs.dotsocr.DotsVisionConfig" ], "n_typable": 49, "n_typed": 13, "n_any": 1, "n_untyped": 35, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 25, "n_classes": 2, "n_attrs": 22, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/eagle.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.configs.eagle.EAGLEConfig", "methods": [ { "kind": "function", "name": "EAGLEConfig.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "EAGLEConfig.from_pretrained", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EAGLEConfig.to_json_string", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EAGLEConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EAGLEConfig.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EAGLEConfig.truncated_vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.eagle", "names": [ "vllm.transformers_utils.configs.eagle.EAGLEConfig" ], "n_typable": 12, "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_classes": 1, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/extract_hidden_states.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.configs.extract_hidden_states.ExtractHiddenStatesConfig", "methods": [ { "kind": "function", "name": "ExtractHiddenStatesConfig.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ExtractHiddenStatesConfig.from_pretrained", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ExtractHiddenStatesConfig.to_json_string", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ExtractHiddenStatesConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 9, "n_typed": 6, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.extract_hidden_states", "names": [ "vllm.transformers_utils.configs.extract_hidden_states.ExtractHiddenStatesConfig" ], "n_typable": 9, "n_typed": 6, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/falcon.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.configs.falcon.RWConfig", "methods": [ { "kind": "function", "name": "RWConfig.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 18, "n_overloads": 1, "n_typable": 19, "n_params": 18, "n_function_overloads": 1, "n_function_params": 18 } ], "properties": [ { "kind": "property", "name": "RWConfig.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "RWConfig.rotary", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "RWConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RWConfig.keys_to_ignore_at_inference", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RWConfig.attribute_map", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RWConfig.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RWConfig.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RWConfig.n_layer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RWConfig.n_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RWConfig.layer_norm_epsilon", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RWConfig.initializer_range", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RWConfig.use_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RWConfig.hidden_dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RWConfig.attention_dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RWConfig.bos_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RWConfig.eos_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RWConfig.multi_query", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RWConfig.n_head_kv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RWConfig.alibi", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RWConfig.bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RWConfig.parallel_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RWConfig.new_decoder_architecture", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 38, "n_typed": 1, "n_any": 0, "n_untyped": 37, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 18, "n_attrs": 20, "n_properties": 2 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.falcon", "names": [ "vllm.transformers_utils.configs.falcon.RWConfig" ], "n_typable": 38, "n_typed": 1, "n_any": 0, "n_untyped": 37, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 18, "n_classes": 1, "n_attrs": 20, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/flex_olmo.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.configs.flex_olmo.FlexOlmoConfig", "methods": [ { "kind": "function", "name": "FlexOlmoConfig.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 24, "n_overloads": 1, "n_typable": 25, "n_params": 24, "n_function_overloads": 1, "n_function_params": 24 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlexOlmoConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlexOlmoConfig.keys_to_ignore_at_inference", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlexOlmoConfig.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlexOlmoConfig.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlexOlmoConfig.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlexOlmoConfig.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlexOlmoConfig.num_hidden_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlexOlmoConfig.num_attention_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlexOlmoConfig.num_key_value_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlexOlmoConfig.hidden_act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlexOlmoConfig.initializer_range", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlexOlmoConfig.rms_norm_eps", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlexOlmoConfig.use_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlexOlmoConfig.rope_parameters", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlexOlmoConfig.attention_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlexOlmoConfig.attention_dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlexOlmoConfig.num_experts_per_tok", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlexOlmoConfig.num_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlexOlmoConfig.output_router_logits", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlexOlmoConfig.router_aux_loss_coef", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlexOlmoConfig.norm_topk_prob", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 44, "n_typed": 1, "n_any": 0, "n_untyped": 43, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 24, "n_attrs": 21, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.flex_olmo", "names": [ "vllm.transformers_utils.configs.flex_olmo.FlexOlmoConfig" ], "n_typable": 44, "n_typed": 1, "n_any": 0, "n_untyped": 43, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 24, "n_classes": 1, "n_attrs": 21, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/funaudiochat.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.configs.funaudiochat.FunAudioChatAudioEncoderConfig", "methods": [ { "kind": "function", "name": "FunAudioChatAudioEncoderConfig.__init__", "n_typed": 24, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 25, "n_params": 24, "n_function_overloads": 1, "n_function_params": 24 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FunAudioChatAudioEncoderConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FunAudioChatAudioEncoderConfig.num_mel_bins", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoderConfig.d_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoderConfig.encoder_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoderConfig.encoder_attention_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoderConfig.encoder_ffn_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoderConfig.dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoderConfig.attention_dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoderConfig.activation_function", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoderConfig.activation_dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoderConfig.num_hidden_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoderConfig.initializer_range", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoderConfig.scale_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoderConfig.max_source_positions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoderConfig.n_window", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoderConfig.output_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoderConfig.bos_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoderConfig.codebook_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoderConfig.continuous_features_mode", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoderConfig.crq_transformer_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoderConfig.eos_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoderConfig.group_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoderConfig.enable_audio_invert_tower", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatAudioEncoderConfig.pad_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 48, "n_typed": 24, "n_any": 0, "n_untyped": 24, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 24, "n_attrs": 24, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.configs.funaudiochat.FunAudioChatConfig", "methods": [ { "kind": "function", "name": "FunAudioChatConfig.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FunAudioChatConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FunAudioChatConfig.attribute_map", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FunAudioChatConfig.audio_token_index", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatConfig.ignore_index", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatConfig.audio_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatConfig.text_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunAudioChatConfig.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 6, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 6, "n_attrs": 7, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.funaudiochat", "names": [ "vllm.transformers_utils.configs.funaudiochat.FunAudioChatAudioEncoderConfig", "vllm.transformers_utils.configs.funaudiochat.FunAudioChatConfig" ], "n_typable": 60, "n_typed": 30, "n_any": 0, "n_untyped": 30, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 30, "n_classes": 2, "n_attrs": 31, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/hunyuan_vl.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.configs.hunyuan_vl.HunYuanVLVisionConfig", "methods": [ { "kind": "function", "name": "HunYuanVLVisionConfig.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 26, "n_overloads": 1, "n_typable": 26, "n_params": 25, "n_function_overloads": 1, "n_function_params": 25 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "HunYuanVLVisionConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "HunYuanVLVisionConfig.base_config_key", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "HunYuanVLVisionConfig.hidden_act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLVisionConfig.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLVisionConfig.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLVisionConfig.interpolate_mode", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLVisionConfig.learnable_mlp_pooling_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLVisionConfig.num_attention_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLVisionConfig.num_channels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLVisionConfig.num_hidden_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLVisionConfig.out_hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLVisionConfig.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLVisionConfig.remove_prenorm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLVisionConfig.spatial_merge_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLVisionConfig.temporal_patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLVisionConfig.rms_norm_eps", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLVisionConfig.resize_resolution", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLVisionConfig.img_max_token_num", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLVisionConfig.max_image_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLVisionConfig.min_image_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLVisionConfig.video_max_image_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLVisionConfig.video_min_image_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLVisionConfig.anyres_vit_max_image_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLVisionConfig.max_vit_seq_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLVisionConfig.text_hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLVisionConfig.num_key_value_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 50, "n_typed": 0, "n_any": 0, "n_untyped": 50, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 25, "n_attrs": 26, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.configs.hunyuan_vl.HunYuanVLConfig", "methods": [ { "kind": "function", "name": "HunYuanVLConfig.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 10, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "HunYuanVLConfig.__setattr__", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "HunYuanVLConfig.__getattribute__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "HunYuanVLConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "HunYuanVLConfig.sub_configs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "HunYuanVLConfig.keys_to_ignore_at_inference", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "HunYuanVLConfig.image_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLConfig.im_start_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLConfig.im_end_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLConfig.im_newline_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLConfig.video_start_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLConfig.video_end_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLConfig.vision_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLConfig.text_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 23, "n_typed": 0, "n_any": 0, "n_untyped": 23, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 12, "n_attrs": 11, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.configs.hunyuan_vl.HunYuanVLTextConfig", "methods": [ { "kind": "function", "name": "HunYuanVLTextConfig.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 23, "n_overloads": 1, "n_typable": 24, "n_params": 23, "n_function_overloads": 1, "n_function_params": 23 }, { "kind": "function", "name": "HunYuanVLTextConfig._rope_scaling_validation", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "HunYuanVLTextConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "HunYuanVLTextConfig.keys_to_ignore_at_inference", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "HunYuanVLTextConfig.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLTextConfig.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLTextConfig.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLTextConfig.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLTextConfig.num_hidden_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLTextConfig.num_attention_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLTextConfig.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLTextConfig.num_key_value_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLTextConfig.hidden_act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLTextConfig.initializer_range", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLTextConfig.rms_norm_eps", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLTextConfig.pretraining_tp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLTextConfig.use_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLTextConfig.rope_theta", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLTextConfig.rope_scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLTextConfig.attention_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLTextConfig.attention_dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 42, "n_typed": 1, "n_any": 0, "n_untyped": 41, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 23, "n_attrs": 19, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.hunyuan_vl", "names": [ "vllm.transformers_utils.configs.hunyuan_vl.HunYuanVLConfig", "vllm.transformers_utils.configs.hunyuan_vl.HunYuanVLTextConfig", "vllm.transformers_utils.configs.hunyuan_vl.HunYuanVLVisionConfig" ], "n_typable": 115, "n_typed": 1, "n_any": 0, "n_untyped": 114, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 60, "n_classes": 3, "n_attrs": 56, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/isaac.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.configs.isaac.PixelShuffleSiglip2VisionConfig", "methods": [ { "kind": "function", "name": "PixelShuffleSiglip2VisionConfig.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PixelShuffleSiglip2VisionConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PixelShuffleSiglip2VisionConfig.base_config_key", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PixelShuffleSiglip2VisionConfig.pixel_shuffle_scale_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PixelShuffleSiglip2VisionConfig.num_patches", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 6, "n_typed": 2, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 3, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.configs.isaac.IsaacConfig", "methods": [ { "kind": "function", "name": "IsaacConfig.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "IsaacConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "IsaacConfig.sub_configs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "IsaacConfig.video_patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "IsaacConfig.vision_max_num_patches", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "IsaacConfig.vision_min_num_patches", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "IsaacConfig.pixel_shuffle_scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "IsaacConfig.max_sequence_length", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "IsaacConfig.vision_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "IsaacConfig.vision_attn_implementation", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "IsaacConfig.text_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "IsaacConfig.vision_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 7, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 10, "n_attrs": 11, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.isaac", "names": [ "vllm.transformers_utils.configs.isaac.IsaacConfig", "vllm.transformers_utils.configs.isaac.PixelShuffleSiglip2VisionConfig" ], "n_typable": 26, "n_typed": 9, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 13, "n_classes": 2, "n_attrs": 15, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/jais.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.configs.jais.JAISConfig", "methods": [ { "kind": "function", "name": "JAISConfig.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 27, "n_overloads": 1, "n_typable": 27, "n_params": 26, "n_function_overloads": 1, "n_function_params": 26 }, { "kind": "function", "name": "JAISConfig._alibi_scaling_validation", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "JAISConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "JAISConfig.keys_to_ignore_at_inference", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "JAISConfig.attribute_map", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "JAISConfig.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISConfig.n_positions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISConfig.n_embd", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISConfig.n_layer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISConfig.n_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISConfig.n_inner", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISConfig.activation_function", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISConfig.resid_pdrop", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISConfig.embd_pdrop", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISConfig.attn_pdrop", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISConfig.layer_norm_epsilon", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISConfig.initializer_range", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISConfig.scale_attn_weights", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISConfig.use_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISConfig.scale_attn_by_inverse_layer_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISConfig.reorder_and_upcast_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISConfig.bos_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISConfig.eos_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISConfig.position_embedding_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISConfig.mup_width_scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISConfig.mup_embeddings_scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISConfig.mup_output_alpha", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISConfig.mup_scale_qk_dot_by_d", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "JAISConfig.alibi_scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 52, "n_typed": 0, "n_any": 0, "n_untyped": 52, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 26, "n_attrs": 27, "n_properties": 0 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.jais.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.jais", "names": [ "vllm.transformers_utils.configs.jais.JAISConfig", "vllm.transformers_utils.configs.jais.logger" ], "n_typable": 53, "n_typed": 0, "n_any": 0, "n_untyped": 53, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 26, "n_classes": 1, "n_attrs": 28, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/kimi_k25.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.configs.kimi_k25.KimiK25VisionConfig", "methods": [ { "kind": "function", "name": "KimiK25VisionConfig.__init__", "n_typed": 16, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 18, "n_params": 17, "n_function_overloads": 1, "n_function_params": 17 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "KimiK25VisionConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "KimiK25VisionConfig.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25VisionConfig.init_pos_emb_height", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25VisionConfig.init_pos_emb_width", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25VisionConfig.init_pos_emb_time", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25VisionConfig.pos_emb_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25VisionConfig.num_attention_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25VisionConfig.num_hidden_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25VisionConfig.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25VisionConfig.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25VisionConfig.merge_kernel_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25VisionConfig.video_attn_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25VisionConfig.merge_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25VisionConfig.mm_projector_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25VisionConfig.projector_hidden_act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25VisionConfig.projector_ln_eps", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25VisionConfig.mm_hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 34, "n_typed": 16, "n_any": 0, "n_untyped": 18, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 17, "n_attrs": 17, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.configs.kimi_k25.KimiK25Config", "methods": [ { "kind": "function", "name": "KimiK25Config.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 } ], "properties": [ { "kind": "property", "name": "KimiK25Config.hidden_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "KimiK25Config.vocab_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "KimiK25Config.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "KimiK25Config.vision_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25Config.text_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25Config.ignore_index", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25Config.media_placeholder_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25Config.use_unified_vision_chunk", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25Config.video_placeholder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiK25Config.quantization_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 11, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 8, "n_attrs": 8, "n_properties": 2 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.kimi_k25", "names": [ "vllm.transformers_utils.configs.kimi_k25.KimiK25Config", "vllm.transformers_utils.configs.kimi_k25.KimiK25VisionConfig" ], "n_typable": 52, "n_typed": 27, "n_any": 0, "n_untyped": 25, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 25, "n_classes": 2, "n_attrs": 25, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/kimi_linear.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.configs.kimi_linear.KimiLinearConfig", "methods": [ { "kind": "function", "name": "KimiLinearConfig.__init__", "n_typed": 20, "n_any": 0, "n_untyped": 19, "n_overloads": 1, "n_typable": 39, "n_params": 38, "n_function_overloads": 1, "n_function_params": 38 }, { "kind": "function", "name": "KimiLinearConfig.is_kda_layer", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "KimiLinearConfig.is_mla", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "KimiLinearConfig.is_moe", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "KimiLinearConfig.is_linear_attn", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "KimiLinearConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearConfig.keys_to_ignore_at_inference", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "KimiLinearConfig.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearConfig.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearConfig.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearConfig.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearConfig.num_hidden_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearConfig.num_attention_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearConfig.num_key_value_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearConfig.hidden_act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearConfig.initializer_range", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearConfig.rms_norm_eps", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearConfig.use_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearConfig.rope_parameters", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearConfig.q_lora_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearConfig.kv_lora_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearConfig.qk_nope_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearConfig.qk_rope_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearConfig.v_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearConfig.mla_use_nope", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearConfig.num_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearConfig.num_experts_per_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearConfig.moe_renormalize", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearConfig.num_shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearConfig.routed_scaling_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearConfig.moe_router_activation_func", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearConfig.moe_intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearConfig.first_k_dense_replace", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearConfig.moe_layer_freq", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearConfig.use_grouped_topk", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearConfig.num_expert_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearConfig.topk_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearConfig.num_nextn_predict_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiLinearConfig.linear_attn_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 77, "n_typed": 22, "n_any": 0, "n_untyped": 55, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 39, "n_attrs": 34, "n_properties": 3 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.kimi_linear.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.kimi_linear", "names": [ "vllm.transformers_utils.configs.kimi_linear.KimiLinearConfig", "vllm.transformers_utils.configs.kimi_linear.logger" ], "n_typable": 78, "n_typed": 22, "n_any": 0, "n_untyped": 56, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 39, "n_classes": 1, "n_attrs": 35, "n_properties": 3, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/kimi_vl.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.configs.kimi_vl.KimiVLConfig", "methods": [ { "kind": "function", "name": "KimiVLConfig.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "KimiVLConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "KimiVLConfig.vision_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiVLConfig.text_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiVLConfig.ignore_index", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KimiVLConfig.media_placeholder_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 5, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 6, "n_attrs": 5, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.kimi_vl", "names": [ "vllm.transformers_utils.configs.kimi_vl.KimiVLConfig" ], "n_typable": 11, "n_typed": 5, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 6, "n_classes": 1, "n_attrs": 5, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/lfm2_moe.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.configs.lfm2_moe.Lfm2MoeConfig", "methods": [ { "kind": "function", "name": "Lfm2MoeConfig.__init__", "n_typed": 24, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 26, "n_params": 25, "n_function_overloads": 1, "n_function_params": 25 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Lfm2MoeConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Lfm2MoeConfig.keys_to_ignore_at_inference", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Lfm2MoeConfig.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeConfig.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeConfig.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeConfig.num_hidden_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeConfig.rope_parameters", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeConfig.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeConfig.use_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeConfig.norm_eps", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeConfig.num_attention_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeConfig.num_key_value_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeConfig.conv_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeConfig.conv_L_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeConfig.num_dense_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeConfig.moe_intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeConfig.num_experts_per_tok", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeConfig.num_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeConfig.use_expert_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeConfig.routed_scaling_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeConfig.norm_topk_prob", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Lfm2MoeConfig.layer_types", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 46, "n_typed": 24, "n_any": 0, "n_untyped": 22, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 25, "n_attrs": 22, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.lfm2_moe", "names": [ "vllm.transformers_utils.configs.lfm2_moe.Lfm2MoeConfig" ], "n_typable": 46, "n_typed": 24, "n_any": 0, "n_untyped": 22, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 25, "n_classes": 1, "n_attrs": 22, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/medusa.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.configs.medusa.MedusaConfig", "methods": [ { "kind": "function", "name": "MedusaConfig.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "MedusaConfig.from_pretrained", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [ { "kind": "property", "name": "MedusaConfig.num_attention_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "MedusaConfig.num_lookahead_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_typable": 2 } ], "attrs": [ { "kind": "attr", "name": "MedusaConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MedusaConfig.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MedusaConfig.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MedusaConfig.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MedusaConfig.num_hidden_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MedusaConfig.max_paths", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MedusaConfig.topk", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MedusaConfig.max_seq_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MedusaConfig.truncated_vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 23, "n_typed": 10, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 10, "n_attrs": 9, "n_properties": 2 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.medusa", "names": [ "vllm.transformers_utils.configs.medusa.MedusaConfig" ], "n_typable": 23, "n_typed": 10, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 10, "n_classes": 1, "n_attrs": 9, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/midashenglm.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.configs.midashenglm.DashengConfig", "methods": [ { "kind": "function", "name": "DashengConfig.__init__", "n_typed": 21, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 23, "n_params": 22, "n_function_overloads": 1, "n_function_params": 22 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DashengConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DashengConfig.embed_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengConfig.outputdim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengConfig.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengConfig.patch_stride", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengConfig.input_channels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengConfig.target_length", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengConfig.depth", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengConfig.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengConfig.mlp_ratio", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengConfig.qkv_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengConfig.init_values", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengConfig.drop_rate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengConfig.attn_drop_rate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengConfig.f_min", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengConfig.f_max", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengConfig.center", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengConfig.win_length", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengConfig.hop_length", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengConfig.sample_rate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengConfig.n_fft", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DashengConfig.n_mels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 44, "n_typed": 21, "n_any": 0, "n_untyped": 23, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 22, "n_attrs": 22, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.configs.midashenglm.MiDashengLMConfig", "methods": [ { "kind": "function", "name": "MiDashengLMConfig.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MiDashengLMConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MiDashengLMConfig.audio_encoder_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiDashengLMConfig.subsample_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiDashengLMConfig.text_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MiDashengLMConfig.audio_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 4, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 5, "n_attrs": 5, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.midashenglm", "names": [ "vllm.transformers_utils.configs.midashenglm.DashengConfig", "vllm.transformers_utils.configs.midashenglm.MiDashengLMConfig" ], "n_typable": 54, "n_typed": 25, "n_any": 0, "n_untyped": 29, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 27, "n_classes": 2, "n_attrs": 27, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/mistral.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.transformers_utils.configs.mistral.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.transformers_utils.configs.mistral.adapt_config_dict", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.mistral", "names": [ "vllm.transformers_utils.configs.mistral.adapt_config_dict", "vllm.transformers_utils.configs.mistral.logger" ], "n_typable": 4, "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/mlp_speculator.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.configs.mlp_speculator.MLPSpeculatorConfig", "methods": [ { "kind": "function", "name": "MLPSpeculatorConfig.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MLPSpeculatorConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MLPSpeculatorConfig.attribute_map", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MLPSpeculatorConfig.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLPSpeculatorConfig.emb_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLPSpeculatorConfig.inner_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLPSpeculatorConfig.n_predict", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLPSpeculatorConfig.top_k_tokens_per_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLPSpeculatorConfig.n_candidates", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLPSpeculatorConfig.num_lookahead_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLPSpeculatorConfig.tie_weights", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MLPSpeculatorConfig.scale_input", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 8, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 9, "n_attrs": 11, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.mlp_speculator", "names": [ "vllm.transformers_utils.configs.mlp_speculator.MLPSpeculatorConfig" ], "n_typable": 19, "n_typed": 8, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 9, "n_classes": 1, "n_attrs": 11, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/moonvit.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.configs.moonvit.MoonViTConfig", "methods": [ { "kind": "function", "name": "MoonViTConfig.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MoonViTConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MoonViTConfig.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonViTConfig.init_pos_emb_height", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonViTConfig.init_pos_emb_width", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonViTConfig.num_hidden_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonViTConfig.num_attention_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonViTConfig.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonViTConfig.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MoonViTConfig.merge_kernel_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 8, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 9, "n_attrs": 9, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.moonvit", "names": [ "vllm.transformers_utils.configs.moonvit.MoonViTConfig" ], "n_typable": 18, "n_typed": 8, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 9, "n_classes": 1, "n_attrs": 9, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/nemotron.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.transformers_utils.configs.nemotron.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.transformers_utils.configs.nemotron.NemotronConfig", "methods": [ { "kind": "function", "name": "NemotronConfig.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 22, "n_overloads": 1, "n_typable": 22, "n_params": 21, "n_function_overloads": 1, "n_function_params": 21 }, { "kind": "function", "name": "NemotronConfig._rope_parameters_validation", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "NemotronConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NemotronConfig.keys_to_ignore_at_inference", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NemotronConfig.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronConfig.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronConfig.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronConfig.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronConfig.num_hidden_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronConfig.num_attention_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronConfig.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronConfig.num_key_value_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronConfig.hidden_act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronConfig.initializer_range", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronConfig.norm_eps", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronConfig.use_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronConfig.rope_parameters", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronConfig.attention_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronConfig.attention_dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronConfig.mlp_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 39, "n_typed": 0, "n_any": 0, "n_untyped": 39, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 21, "n_attrs": 18, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.nemotron", "names": [ "vllm.transformers_utils.configs.nemotron.NemotronConfig", "vllm.transformers_utils.configs.nemotron.logger" ], "n_typable": 40, "n_typed": 0, "n_any": 0, "n_untyped": 40, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 21, "n_classes": 1, "n_attrs": 19, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/nemotron_h.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.configs.nemotron_h.NemotronHConfig", "methods": [ { "kind": "function", "name": "NemotronHConfig.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 54, "n_overloads": 1, "n_typable": 54, "n_params": 53, "n_function_overloads": 1, "n_function_params": 53 } ], "properties": [ { "kind": "property", "name": "NemotronHConfig.layers_block_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "NemotronHConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NemotronHConfig.keys_to_ignore_at_inference", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NemotronHConfig.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.tie_word_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.num_hidden_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.hybrid_override_pattern", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.mtp_hybrid_override_pattern", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.num_attention_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.sliding_window", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.attention_dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.hidden_dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.num_key_value_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.mlp_hidden_act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.attention_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.mlp_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.use_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.initializer_range", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.layer_norm_epsilon", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.residual_in_fp32", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.use_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.num_logits_to_keep", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.use_mamba_kernels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.n_groups", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.mamba_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.ssm_state_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.mamba_num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.conv_kernel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.expand", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.mamba_hidden_act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.time_step_min", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.time_step_max", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.time_step_limit", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.time_step_floor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.use_conv_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.mamba_proj_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.chunk_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.rescale_prenorm_residual", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.n_routed_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.n_shared_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.moe_intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.moe_shared_expert_intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.moe_latent_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.num_experts_per_tok", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.routed_scaling_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.n_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.topk_group", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NemotronHConfig.norm_topk_prob", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 104, "n_typed": 0, "n_any": 0, "n_untyped": 104, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 53, "n_attrs": 51, "n_properties": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.nemotron_h.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.nemotron_h", "names": [ "vllm.transformers_utils.configs.nemotron_h.NemotronHConfig", "vllm.transformers_utils.configs.nemotron_h.logger" ], "n_typable": 105, "n_typed": 0, "n_any": 0, "n_untyped": 105, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 53, "n_classes": 1, "n_attrs": 52, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/olmo3.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.configs.olmo3.Olmo3Config", "methods": [ { "kind": "function", "name": "Olmo3Config.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 22, "n_overloads": 1, "n_typable": 22, "n_params": 21, "n_function_overloads": 1, "n_function_params": 21 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Olmo3Config.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Olmo3Config.keys_to_ignore_at_inference", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Olmo3Config.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo3Config.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo3Config.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo3Config.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo3Config.num_hidden_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo3Config.num_attention_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo3Config.num_key_value_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo3Config.hidden_act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo3Config.initializer_range", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo3Config.use_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo3Config.rope_parameters", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo3Config.attention_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo3Config.attention_dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo3Config.rms_norm_eps", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo3Config.sliding_window", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Olmo3Config.layer_types", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 38, "n_typed": 0, "n_any": 0, "n_untyped": 38, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 21, "n_attrs": 18, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.olmo3", "names": [ "vllm.transformers_utils.configs.olmo3.Olmo3Config" ], "n_typable": 38, "n_typed": 0, "n_any": 0, "n_untyped": 38, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 21, "n_classes": 1, "n_attrs": 18, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/ovis.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.configs.ovis.SiglipVisualTokenizerConfig", "methods": [ { "kind": "function", "name": "SiglipVisualTokenizerConfig.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SiglipVisualTokenizerConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SiglipVisualTokenizerConfig.drop_cls_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 3, "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.configs.ovis.AIMv2Config", "methods": [ { "kind": "function", "name": "AIMv2Config.__init__", "n_typed": 12, "n_any": 1, "n_untyped": 1, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AIMv2Config.model_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AIMv2Config.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AIMv2Config.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AIMv2Config.num_hidden_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AIMv2Config.num_attention_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AIMv2Config.num_channels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AIMv2Config.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AIMv2Config.image_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AIMv2Config.attention_dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AIMv2Config.rms_norm_eps", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AIMv2Config.projection_dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AIMv2Config.qkv_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AIMv2Config.use_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 27, "n_typed": 13, "n_any": 1, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 13, "n_attrs": 13, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.configs.ovis.BaseVisualTokenizerConfig", "methods": [ { "kind": "function", "name": "BaseVisualTokenizerConfig.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 7, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BaseVisualTokenizerConfig.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseVisualTokenizerConfig.tokenize_function", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseVisualTokenizerConfig.tau", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseVisualTokenizerConfig.depths", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseVisualTokenizerConfig.backbone_kwargs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseVisualTokenizerConfig.drop_cls_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseVisualTokenizerConfig.backbone_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseVisualTokenizerConfig.hidden_stride", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 2, "n_any": 0, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 8, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.configs.ovis.Aimv2VisualTokenizerConfig", "methods": [ { "kind": "function", "name": "Aimv2VisualTokenizerConfig.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Aimv2VisualTokenizerConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Aimv2VisualTokenizerConfig.drop_cls_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 3, "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.configs.ovis.OvisConfig", "methods": [ { "kind": "function", "name": "OvisConfig.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 7, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OvisConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "OvisConfig.text_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OvisConfig.visual_tokenizer_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OvisConfig.multimodal_max_length", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OvisConfig.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OvisConfig.conversation_formatter_class", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OvisConfig.llm_attn_implementation", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OvisConfig.disable_tie_weight", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 2, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 8, "n_attrs": 8, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.ovis", "names": [ "vllm.transformers_utils.configs.ovis.AIMv2Config", "vllm.transformers_utils.configs.ovis.Aimv2VisualTokenizerConfig", "vllm.transformers_utils.configs.ovis.BaseVisualTokenizerConfig", "vllm.transformers_utils.configs.ovis.OvisConfig", "vllm.transformers_utils.configs.ovis.SiglipVisualTokenizerConfig" ], "n_typable": 66, "n_typed": 17, "n_any": 1, "n_untyped": 48, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 31, "n_classes": 5, "n_attrs": 33, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/parakeet.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.configs.parakeet.ParakeetConfig", "methods": [ { "kind": "function", "name": "ParakeetConfig.from_hf_config", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ParakeetConfig.llm_hidden_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParakeetConfig.projection_hidden_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParakeetConfig.projection_bias", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParakeetConfig.projection_eps", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParakeetConfig.sampling_rate", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 9, "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 3, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.configs.parakeet.ExtractorConfig", "methods": [ { "kind": "function", "name": "ExtractorConfig.from_hf_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ExtractorConfig.feature_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ExtractorConfig.sampling_rate", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ExtractorConfig.subsampling_factor", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ExtractorConfig.subsampling_conv_kernel_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ExtractorConfig.subsampling_conv_stride", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ExtractorConfig.clip_duration_s", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ExtractorConfig.clip_min_duration_s", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 7, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.parakeet", "names": [ "vllm.transformers_utils.configs.parakeet.ExtractorConfig", "vllm.transformers_utils.configs.parakeet.ParakeetConfig" ], "n_typable": 11, "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_classes": 2, "n_attrs": 12, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/qwen3_5.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.configs.qwen3_5.Qwen3_5TextConfig", "methods": [ { "kind": "function", "name": "Qwen3_5TextConfig.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 27, "n_overloads": 1, "n_typable": 27, "n_params": 26, "n_function_overloads": 1, "n_function_params": 26 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3_5TextConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3_5TextConfig.keys_to_ignore_at_inference", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3_5TextConfig.base_model_tp_plan", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3_5TextConfig.base_model_pp_plan", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3_5TextConfig.base_config_key", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3_5TextConfig.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5TextConfig.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5TextConfig.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5TextConfig.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5TextConfig.num_hidden_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5TextConfig.num_attention_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5TextConfig.num_key_value_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5TextConfig.hidden_act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5TextConfig.initializer_range", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5TextConfig.rms_norm_eps", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5TextConfig.use_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5TextConfig.attention_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5TextConfig.attention_dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5TextConfig.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5TextConfig.rope_parameters", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5TextConfig.layer_types", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5TextConfig.linear_conv_kernel_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5TextConfig.linear_key_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5TextConfig.linear_value_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5TextConfig.linear_num_key_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5TextConfig.linear_num_value_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5TextConfig.pad_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5TextConfig.bos_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5TextConfig.eos_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5TextConfig.tie_word_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 52, "n_typed": 0, "n_any": 0, "n_untyped": 52, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 26, "n_attrs": 30, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.configs.qwen3_5.Qwen3_5Config", "methods": [ { "kind": "function", "name": "Qwen3_5Config.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 9, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3_5Config.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3_5Config.sub_configs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3_5Config.keys_to_ignore_at_inference", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3_5Config.image_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5Config.video_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5Config.vision_start_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5Config.vision_end_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5Config.tie_word_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5Config.vision_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5Config.text_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 0, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 8, "n_attrs": 10, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.qwen3_5", "names": [ "vllm.transformers_utils.configs.qwen3_5.Qwen3_5Config", "vllm.transformers_utils.configs.qwen3_5.Qwen3_5TextConfig" ], "n_typable": 68, "n_typed": 0, "n_any": 0, "n_untyped": 68, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 34, "n_classes": 2, "n_attrs": 40, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/qwen3_5_moe.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.configs.qwen3_5_moe.Qwen3_5MoeTextConfig", "methods": [ { "kind": "function", "name": "Qwen3_5MoeTextConfig.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 32, "n_overloads": 1, "n_typable": 32, "n_params": 31, "n_function_overloads": 1, "n_function_params": 31 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3_5MoeTextConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3_5MoeTextConfig.keys_to_ignore_at_inference", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3_5MoeTextConfig.base_model_tp_plan", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3_5MoeTextConfig.base_model_pp_plan", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3_5MoeTextConfig.base_config_key", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3_5MoeTextConfig.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeTextConfig.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeTextConfig.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeTextConfig.num_hidden_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeTextConfig.num_attention_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeTextConfig.num_key_value_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeTextConfig.hidden_act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeTextConfig.initializer_range", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeTextConfig.rms_norm_eps", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeTextConfig.use_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeTextConfig.attention_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeTextConfig.attention_dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeTextConfig.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeTextConfig.rope_parameters", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeTextConfig.layer_types", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeTextConfig.linear_conv_kernel_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeTextConfig.linear_key_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeTextConfig.linear_value_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeTextConfig.linear_num_key_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeTextConfig.linear_num_value_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeTextConfig.moe_intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeTextConfig.shared_expert_intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeTextConfig.num_experts_per_tok", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeTextConfig.num_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeTextConfig.output_router_logits", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeTextConfig.router_aux_loss_coef", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeTextConfig.pad_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeTextConfig.bos_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeTextConfig.eos_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeTextConfig.tie_word_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 62, "n_typed": 0, "n_any": 0, "n_untyped": 62, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 31, "n_attrs": 35, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.configs.qwen3_5_moe.Qwen3_5MoeConfig", "methods": [ { "kind": "function", "name": "Qwen3_5MoeConfig.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 9, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3_5MoeConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3_5MoeConfig.sub_configs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3_5MoeConfig.keys_to_ignore_at_inference", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3_5MoeConfig.image_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeConfig.video_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeConfig.vision_start_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeConfig.vision_end_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeConfig.tie_word_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeConfig.vision_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3_5MoeConfig.text_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 0, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 8, "n_attrs": 10, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.qwen3_5_moe", "names": [ "vllm.transformers_utils.configs.qwen3_5_moe.Qwen3_5MoeConfig", "vllm.transformers_utils.configs.qwen3_5_moe.Qwen3_5MoeTextConfig" ], "n_typable": 78, "n_typed": 0, "n_any": 0, "n_untyped": 78, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 39, "n_classes": 2, "n_attrs": 45, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/qwen3_asr.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.configs.qwen3_asr.Qwen3ASRAudioEncoderConfig", "methods": [ { "kind": "function", "name": "Qwen3ASRAudioEncoderConfig.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 19, "n_overloads": 1, "n_typable": 19, "n_params": 18, "n_function_overloads": 1, "n_function_params": 18 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3ASRAudioEncoderConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3ASRAudioEncoderConfig.num_mel_bins", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3ASRAudioEncoderConfig.d_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3ASRAudioEncoderConfig.encoder_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3ASRAudioEncoderConfig.encoder_attention_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3ASRAudioEncoderConfig.encoder_ffn_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3ASRAudioEncoderConfig.dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3ASRAudioEncoderConfig.attention_dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3ASRAudioEncoderConfig.activation_function", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3ASRAudioEncoderConfig.activation_dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3ASRAudioEncoderConfig.num_hidden_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3ASRAudioEncoderConfig.initializer_range", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3ASRAudioEncoderConfig.scale_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3ASRAudioEncoderConfig.max_source_positions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3ASRAudioEncoderConfig.n_window", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3ASRAudioEncoderConfig.output_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3ASRAudioEncoderConfig.n_window_infer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3ASRAudioEncoderConfig.conv_chunksize", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3ASRAudioEncoderConfig.downsample_hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 37, "n_typed": 0, "n_any": 0, "n_untyped": 37, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 18, "n_attrs": 19, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.configs.qwen3_asr.Qwen3ASRConfig", "methods": [ { "kind": "function", "name": "Qwen3ASRConfig.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Qwen3ASRConfig.get_text_config", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3ASRConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3ASRConfig.sub_configs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3ASRConfig.thinker_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3ASRConfig.support_languages", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 1, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.configs.qwen3_asr.Qwen3ASRThinkerConfig", "methods": [ { "kind": "function", "name": "Qwen3ASRThinkerConfig.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 8, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3ASRThinkerConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3ASRThinkerConfig.attribute_map", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3ASRThinkerConfig.sub_configs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3ASRThinkerConfig.user_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3ASRThinkerConfig.audio_start_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3ASRThinkerConfig.initializer_range", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3ASRThinkerConfig.audio_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3ASRThinkerConfig.text_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3ASRThinkerConfig.audio_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 0, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 7, "n_attrs": 9, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.qwen3_asr", "names": [ "vllm.transformers_utils.configs.qwen3_asr.Qwen3ASRAudioEncoderConfig", "vllm.transformers_utils.configs.qwen3_asr.Qwen3ASRConfig", "vllm.transformers_utils.configs.qwen3_asr.Qwen3ASRThinkerConfig" ], "n_typable": 59, "n_typed": 1, "n_any": 0, "n_untyped": 58, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 29, "n_classes": 3, "n_attrs": 32, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/qwen3_next.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.configs.qwen3_next.Qwen3NextConfig", "methods": [ { "kind": "function", "name": "Qwen3NextConfig.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 33, "n_overloads": 1, "n_typable": 33, "n_params": 32, "n_function_overloads": 1, "n_function_params": 32 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3NextConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3NextConfig.keys_to_ignore_at_inference", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3NextConfig.base_model_tp_plan", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3NextConfig.base_model_pp_plan", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3NextConfig.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextConfig.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextConfig.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextConfig.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextConfig.num_hidden_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextConfig.num_attention_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextConfig.num_key_value_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextConfig.hidden_act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextConfig.initializer_range", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextConfig.rms_norm_eps", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextConfig.use_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextConfig.rope_parameters", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextConfig.partial_rotary_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextConfig.attention_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextConfig.attention_dropout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextConfig.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextConfig.layer_types", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextConfig.linear_conv_kernel_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextConfig.linear_key_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextConfig.linear_value_head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextConfig.linear_num_key_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextConfig.linear_num_value_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextConfig.decoder_sparse_step", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextConfig.moe_intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextConfig.shared_expert_intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextConfig.num_experts_per_tok", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextConfig.num_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextConfig.norm_topk_prob", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextConfig.output_router_logits", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextConfig.router_aux_loss_coef", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3NextConfig.mlp_only_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 64, "n_typed": 0, "n_any": 0, "n_untyped": 64, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 32, "n_attrs": 35, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.qwen3_next", "names": [ "vllm.transformers_utils.configs.qwen3_next.Qwen3NextConfig" ], "n_typable": 64, "n_typed": 0, "n_any": 0, "n_untyped": 64, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 32, "n_classes": 1, "n_attrs": 35, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/radio.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.transformers_utils.configs.radio.OPENAI_CLIP_MEAN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.transformers_utils.configs.radio.RadioConfig", "methods": [ { "kind": "function", "name": "RadioConfig.__init__", "n_typed": 15, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 17, "n_params": 16, "n_function_overloads": 1, "n_function_params": 16 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RadioConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RadioConfig.model_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RadioConfig.image_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RadioConfig.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RadioConfig.qkv_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RadioConfig.qk_normalization", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RadioConfig.norm_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RadioConfig.layer_norm_eps", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RadioConfig.initializer_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RadioConfig.hidden_act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RadioConfig.cpe_max_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RadioConfig.norm_mean", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RadioConfig.norm_std", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RadioConfig.register_multiple", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RadioConfig.teachers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RadioConfig.cls_token_per_teacher", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 32, "n_typed": 15, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 16, "n_attrs": 16, "n_properties": 0 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.radio.VIT_TIMM_DIM_BY_NAME", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.radio.OPENAI_CLIP_STD", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.transformers_utils.configs.radio.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.radio", "names": [ "vllm.transformers_utils.configs.radio.OPENAI_CLIP_MEAN", "vllm.transformers_utils.configs.radio.OPENAI_CLIP_STD", "vllm.transformers_utils.configs.radio.RadioConfig", "vllm.transformers_utils.configs.radio.VIT_TIMM_DIM_BY_NAME", "vllm.transformers_utils.configs.radio.logger" ], "n_typable": 34, "n_typed": 16, "n_any": 0, "n_untyped": 18, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 16, "n_classes": 1, "n_attrs": 20, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/speculators/algos.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.transformers_utils.configs.speculators.algos.SUPPORTED_SPECULATORS_TYPES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.transformers_utils.configs.speculators.algos.register_speculator", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.transformers_utils.configs.speculators.algos.update_eagle3", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.speculators.algos", "names": [ "vllm.transformers_utils.configs.speculators.algos.SUPPORTED_SPECULATORS_TYPES", "vllm.transformers_utils.configs.speculators.algos.register_speculator", "vllm.transformers_utils.configs.speculators.algos.update_eagle3" ], "n_typable": 5, "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 3, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/speculators/base.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.configs.speculators.base.SpeculatorsConfig", "methods": [ { "kind": "function", "name": "SpeculatorsConfig.from_pretrained", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SpeculatorsConfig.extract_transformers_pre_trained_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SpeculatorsConfig.extract_vllm_speculative_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SpeculatorsConfig.validate_speculators_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SpeculatorsConfig.build_vllm_speculative_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SpeculatorsConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 11, "n_typed": 10, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 6, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.speculators.base", "names": [ "vllm.transformers_utils.configs.speculators.base.SpeculatorsConfig" ], "n_typable": 11, "n_typed": 10, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 6, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/step3_vl.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.configs.step3_vl.Step3VLConfig", "methods": [ { "kind": "function", "name": "Step3VLConfig.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Step3VLConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Step3VLConfig.vision_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VLConfig.text_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VLConfig.understand_projector_stride", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VLConfig.projector_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VLConfig.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VLConfig.image_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 6, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 6, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.configs.step3_vl.Step3VisionEncoderConfig", "methods": [ { "kind": "function", "name": "Step3VisionEncoderConfig.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 12, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Step3VisionEncoderConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Step3VisionEncoderConfig.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VisionEncoderConfig.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VisionEncoderConfig.output_hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VisionEncoderConfig.num_hidden_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VisionEncoderConfig.num_attention_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VisionEncoderConfig.num_channels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VisionEncoderConfig.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VisionEncoderConfig.image_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VisionEncoderConfig.layer_norm_eps", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3VisionEncoderConfig.hidden_act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 0, "n_any": 0, "n_untyped": 22, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 11, "n_attrs": 11, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.configs.step3_vl.Step3TextConfig", "methods": [ { "kind": "function", "name": "Step3TextConfig.__init__", "n_typed": 19, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 20, "n_params": 19, "n_function_overloads": 1, "n_function_params": 19 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Step3TextConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Step3TextConfig.architectures", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Step3TextConfig.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextConfig.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextConfig.num_attention_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextConfig.num_attention_groups", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextConfig.num_hidden_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextConfig.max_seq_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextConfig.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextConfig.rms_norm_eps", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextConfig.moe_intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextConfig.moe_num_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextConfig.moe_top_k", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextConfig.rope_parameters", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextConfig.max_position_embedding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextConfig.share_expert_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextConfig.share_q_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextConfig.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextConfig.norm_expert_weight", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3TextConfig.moe_layers_enum", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 38, "n_typed": 19, "n_any": 0, "n_untyped": 19, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 19, "n_attrs": 20, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.step3_vl", "names": [ "vllm.transformers_utils.configs.step3_vl.Step3TextConfig", "vllm.transformers_utils.configs.step3_vl.Step3VLConfig", "vllm.transformers_utils.configs.step3_vl.Step3VisionEncoderConfig" ], "n_typable": 73, "n_typed": 25, "n_any": 0, "n_untyped": 48, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 36, "n_classes": 3, "n_attrs": 38, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/step3p5.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.configs.step3p5.Step3p5Config", "methods": [ { "kind": "function", "name": "Step3p5Config.__init__", "n_typed": 35, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 37, "n_params": 36, "n_function_overloads": 1, "n_function_params": 36 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Step3p5Config.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Step3p5Config.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Config.intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Config.num_attention_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Config.num_attention_groups", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Config.num_hidden_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Config.max_seq_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Config.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Config.rms_norm_eps", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Config.use_moe", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Config.moe_intermediate_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Config.moe_every_n_layer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Config.moe_num_experts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Config.num_experts_per_tok", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Config.moe_top_k", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Config.moe_layer_offset", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Config.rope_theta", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Config.rope_scaling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Config.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Config.norm_expert_weight", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Config.max_position_embeddings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Config.moe_router_activation", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Config.moe_router_scaling_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Config.use_moe_router_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Config.need_fp32_gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Config.att_impl_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Config.use_head_wise_attn_gate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Config.layer_types", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Config.use_rope_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Config.yarn_only_types", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Config.attention_other_setting", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Config.num_nextn_predict_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Config.swiglu_limits", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Config.swiglu_limits_shared", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Config.bos_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Config.eos_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Step3p5Config.share_expert_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 73, "n_typed": 35, "n_any": 0, "n_untyped": 38, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 36, "n_attrs": 37, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.step3p5", "names": [ "vllm.transformers_utils.configs.step3p5.Step3p5Config" ], "n_typable": 73, "n_typed": 35, "n_any": 0, "n_untyped": 38, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 36, "n_classes": 1, "n_attrs": 37, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/tarsier2.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.configs.tarsier2.Tarsier2Config", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Tarsier2Config.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.tarsier2", "names": [ "vllm.transformers_utils.configs.tarsier2.Tarsier2Config" ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/configs/ultravox.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.configs.ultravox.UltravoxConfig", "methods": [ { "kind": "function", "name": "UltravoxConfig.__init__", "n_typed": 12, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 }, { "kind": "function", "name": "UltravoxConfig.__setattr__", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [ { "kind": "property", "name": "UltravoxConfig.text_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "UltravoxConfig.wrapped_model_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "UltravoxConfig.model_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "UltravoxConfig.audio_token", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "UltravoxConfig.is_composition", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "UltravoxConfig.ignore_index", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UltravoxConfig.audio_token_index", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UltravoxConfig.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UltravoxConfig.stack_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UltravoxConfig.norm_init", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UltravoxConfig.projector_act", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UltravoxConfig.projector_ln_mid", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UltravoxConfig.num_projector_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UltravoxConfig.text_model_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UltravoxConfig.audio_model_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UltravoxConfig.audio_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 30, "n_typed": 14, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 15, "n_attrs": 15, "n_properties": 1 } ], "type_ignores": [], "name": "vllm.transformers_utils.configs.ultravox", "names": [ "vllm.transformers_utils.configs.ultravox.UltravoxConfig" ], "n_typable": 30, "n_typed": 14, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 15, "n_classes": 1, "n_attrs": 15, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/dynamic_module.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.transformers_utils.dynamic_module.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.transformers_utils.dynamic_module.try_get_class_from_dynamic_module", "n_typed": 14, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 15, "n_params": 14, "n_function_overloads": 1, "n_function_params": 14 } ], "type_ignores": [], "name": "vllm.transformers_utils.dynamic_module", "names": [ "vllm.transformers_utils.dynamic_module.logger", "vllm.transformers_utils.dynamic_module.try_get_class_from_dynamic_module" ], "n_typable": 16, "n_typed": 14, "n_any": 0, "n_untyped": 2, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 14, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/gguf_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.transformers_utils.gguf_utils.detect_gguf_multimodal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.transformers_utils.gguf_utils.maybe_patch_hf_config_from_gguf", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.transformers_utils.gguf_utils.is_remote_gguf", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.transformers_utils.gguf_utils.is_gguf", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.transformers_utils.gguf_utils.get_gguf_file_path_from_hf", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.transformers_utils.gguf_utils.check_gguf_file", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.transformers_utils.gguf_utils.split_remote_gguf", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.transformers_utils.gguf_utils.extract_vision_config_from_gguf", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.transformers_utils.gguf_utils.is_valid_gguf_quant_type", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.gguf_utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.transformers_utils.gguf_utils", "names": [ "vllm.transformers_utils.gguf_utils.check_gguf_file", "vllm.transformers_utils.gguf_utils.detect_gguf_multimodal", "vllm.transformers_utils.gguf_utils.extract_vision_config_from_gguf", "vllm.transformers_utils.gguf_utils.get_gguf_file_path_from_hf", "vllm.transformers_utils.gguf_utils.is_gguf", "vllm.transformers_utils.gguf_utils.is_remote_gguf", "vllm.transformers_utils.gguf_utils.is_valid_gguf_quant_type", "vllm.transformers_utils.gguf_utils.logger", "vllm.transformers_utils.gguf_utils.maybe_patch_hf_config_from_gguf", "vllm.transformers_utils.gguf_utils.split_remote_gguf" ], "n_typable": 22, "n_typed": 21, "n_any": 0, "n_untyped": 1, "n_functions": 9, "n_function_overloads": 9, "n_function_params": 12, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/model_arch_config_convertor.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.model_arch_config_convertor.MPTModelArchConfigConvertor", "methods": [ { "kind": "function", "name": "MPTModelArchConfigConvertor.get_total_num_kv_heads", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.model_arch_config_convertor.LongCatFlashMTPModelArchConfigConvertor", "methods": [ { "kind": "function", "name": "LongCatFlashMTPModelArchConfigConvertor.get_num_hidden_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.model_arch_config_convertor.Qwen3_5MTPModelArchConfigConvertor", "methods": [ { "kind": "function", "name": "Qwen3_5MTPModelArchConfigConvertor.get_num_hidden_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.model_arch_config_convertor.FalconModelArchConfigConvertor", "methods": [ { "kind": "function", "name": "FalconModelArchConfigConvertor.get_total_num_kv_heads", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.model_arch_config_convertor.TerratorchModelArchConfigConvertor", "methods": [ { "kind": "function", "name": "TerratorchModelArchConfigConvertor.get_head_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TerratorchModelArchConfigConvertor.get_total_num_kv_heads", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.model_arch_config_convertor.GLM4MoeMTPModelArchConfigConvertor", "methods": [ { "kind": "function", "name": "GLM4MoeMTPModelArchConfigConvertor.get_num_hidden_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.transformers_utils.model_arch_config_convertor.MODEL_ARCH_CONFIG_CONVERTORS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.transformers_utils.model_arch_config_convertor.DbrxModelArchConfigConvertor", "methods": [ { "kind": "function", "name": "DbrxModelArchConfigConvertor.get_total_num_kv_heads", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.model_arch_config_convertor.Qwen3NextMTPModelArchConfigConvertor", "methods": [ { "kind": "function", "name": "Qwen3NextMTPModelArchConfigConvertor.get_num_hidden_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.model_arch_config_convertor.DeepSeekMTPModelArchConfigConvertor", "methods": [ { "kind": "function", "name": "DeepSeekMTPModelArchConfigConvertor.get_num_hidden_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.model_arch_config_convertor.ModelArchConfigConvertorBase", "methods": [ { "kind": "function", "name": "ModelArchConfigConvertorBase.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ModelArchConfigConvertorBase.get_architectures", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelArchConfigConvertorBase.get_num_hidden_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelArchConfigConvertorBase.get_total_num_attention_heads", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelArchConfigConvertorBase.get_vocab_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelArchConfigConvertorBase.get_hidden_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelArchConfigConvertorBase.get_head_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelArchConfigConvertorBase.get_total_num_kv_heads", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelArchConfigConvertorBase.get_num_experts_from_block_configs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelArchConfigConvertorBase.get_num_experts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelArchConfigConvertorBase.get_torch_dtype", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ModelArchConfigConvertorBase._normalize_quantization_config", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModelArchConfigConvertorBase.get_quantization_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelArchConfigConvertorBase.is_deepseek_mla", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelArchConfigConvertorBase.derive_max_model_len_and_key", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelArchConfigConvertorBase.convert", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ModelArchConfigConvertorBase.hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModelArchConfigConvertorBase.hf_text_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 25, "n_typed": 19, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 16, "n_method_overloads": 16, "n_method_params": 7, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.model_arch_config_convertor.MimoMTPModelArchConfigConvertor", "methods": [ { "kind": "function", "name": "MimoMTPModelArchConfigConvertor.get_num_hidden_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.model_arch_config_convertor.Zamba2ModelArchConfigConvertor", "methods": [ { "kind": "function", "name": "Zamba2ModelArchConfigConvertor.get_head_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.model_arch_config_convertor.ErnieMTPModelArchConfigConvertor", "methods": [ { "kind": "function", "name": "ErnieMTPModelArchConfigConvertor.get_num_hidden_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.model_arch_config_convertor.PanguUltraMoeMTPModelArchConfigConvertor", "methods": [ { "kind": "function", "name": "PanguUltraMoeMTPModelArchConfigConvertor.get_num_hidden_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.model_arch_config_convertor.NemotronNasModelArchConfigConvertor", "methods": [ { "kind": "function", "name": "NemotronNasModelArchConfigConvertor.get_total_num_kv_heads", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.model_arch_config_convertor.MambaModelArchConfigConvertor", "methods": [ { "kind": "function", "name": "MambaModelArchConfigConvertor.get_head_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MambaModelArchConfigConvertor.get_total_num_kv_heads", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.model_arch_config_convertor.MedusaModelArchConfigConvertor", "methods": [ { "kind": "function", "name": "MedusaModelArchConfigConvertor.get_head_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MedusaModelArchConfigConvertor.get_total_num_kv_heads", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.transformers_utils.model_arch_config_convertor.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.transformers_utils.model_arch_config_convertor", "names": [ "vllm.transformers_utils.model_arch_config_convertor.DbrxModelArchConfigConvertor", "vllm.transformers_utils.model_arch_config_convertor.DeepSeekMTPModelArchConfigConvertor", "vllm.transformers_utils.model_arch_config_convertor.ErnieMTPModelArchConfigConvertor", "vllm.transformers_utils.model_arch_config_convertor.FalconModelArchConfigConvertor", "vllm.transformers_utils.model_arch_config_convertor.GLM4MoeMTPModelArchConfigConvertor", "vllm.transformers_utils.model_arch_config_convertor.LongCatFlashMTPModelArchConfigConvertor", "vllm.transformers_utils.model_arch_config_convertor.MODEL_ARCH_CONFIG_CONVERTORS", "vllm.transformers_utils.model_arch_config_convertor.MPTModelArchConfigConvertor", "vllm.transformers_utils.model_arch_config_convertor.MambaModelArchConfigConvertor", "vllm.transformers_utils.model_arch_config_convertor.MedusaModelArchConfigConvertor", "vllm.transformers_utils.model_arch_config_convertor.MimoMTPModelArchConfigConvertor", "vllm.transformers_utils.model_arch_config_convertor.ModelArchConfigConvertorBase", "vllm.transformers_utils.model_arch_config_convertor.NemotronNasModelArchConfigConvertor", "vllm.transformers_utils.model_arch_config_convertor.PanguUltraMoeMTPModelArchConfigConvertor", "vllm.transformers_utils.model_arch_config_convertor.Qwen3NextMTPModelArchConfigConvertor", "vllm.transformers_utils.model_arch_config_convertor.Qwen3_5MTPModelArchConfigConvertor", "vllm.transformers_utils.model_arch_config_convertor.TerratorchModelArchConfigConvertor", "vllm.transformers_utils.model_arch_config_convertor.Zamba2ModelArchConfigConvertor", "vllm.transformers_utils.model_arch_config_convertor.logger" ], "n_typable": 45, "n_typed": 38, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 35, "n_method_overloads": 35, "n_method_params": 7, "n_classes": 17, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/processor.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.transformers_utils.processor.cached_get_feature_extractor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.processor.cached_get_image_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.transformers_utils.processor.cached_image_processor_from_config", "n_typed": 1, "n_any": 1, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.transformers_utils.processor.get_processor_kwargs_keys", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.transformers_utils.processor.get_image_processor", "n_typed": 3, "n_any": 2, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.transformers_utils.processor.get_processor_kwargs_type", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.transformers_utils.processor.get_feature_extractor", "n_typed": 3, "n_any": 2, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.transformers_utils.processor.cached_processor_from_config", "n_typed": 3, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.transformers_utils.processor.HashableList", "methods": [ { "kind": "function", "name": "HashableList.__hash__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.transformers_utils.processor.cached_video_processor_from_config", "n_typed": 2, "n_any": 1, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.transformers_utils.processor.cached_get_processor_without_dynamic_kwargs", "n_typed": 5, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.transformers_utils.processor.get_video_processor", "n_typed": 4, "n_any": 2, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "class", "name": "vllm.transformers_utils.processor.HashableDict", "methods": [ { "kind": "function", "name": "HashableDict.__hash__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.transformers_utils.processor.cached_get_video_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.transformers_utils.processor.cached_feature_extractor_from_config", "n_typed": 1, "n_any": 1, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.transformers_utils.processor.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.transformers_utils.processor.get_processor", "n_typed": 5, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "attr", "name": "vllm.transformers_utils.processor.cached_get_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [ { "kind": "type", "rules": [ "override" ] }, { "kind": "type", "rules": [ "override" ] } ], "name": "vllm.transformers_utils.processor", "names": [ "vllm.transformers_utils.processor.HashableDict", "vllm.transformers_utils.processor.HashableList", "vllm.transformers_utils.processor.cached_feature_extractor_from_config", "vllm.transformers_utils.processor.cached_get_feature_extractor", "vllm.transformers_utils.processor.cached_get_image_processor", "vllm.transformers_utils.processor.cached_get_processor", "vllm.transformers_utils.processor.cached_get_processor_without_dynamic_kwargs", "vllm.transformers_utils.processor.cached_get_video_processor", "vllm.transformers_utils.processor.cached_image_processor_from_config", "vllm.transformers_utils.processor.cached_processor_from_config", "vllm.transformers_utils.processor.cached_video_processor_from_config", "vllm.transformers_utils.processor.get_feature_extractor", "vllm.transformers_utils.processor.get_image_processor", "vllm.transformers_utils.processor.get_processor", "vllm.transformers_utils.processor.get_processor_kwargs_keys", "vllm.transformers_utils.processor.get_processor_kwargs_type", "vllm.transformers_utils.processor.get_video_processor", "vllm.transformers_utils.processor.logger" ], "n_typable": 58, "n_typed": 33, "n_any": 14, "n_untyped": 11, "n_functions": 11, "n_function_overloads": 11, "n_function_params": 40, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 0, "n_classes": 2, "n_attrs": 5, "n_properties": 0, "n_type_ignores": 2 }, { "path": "vllm/transformers_utils/processors/hunyuan_vl.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.processors.hunyuan_vl.HunYuanVLProcessor", "methods": [ { "kind": "function", "name": "HunYuanVLProcessor.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "HunYuanVLProcessor.__call__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "HunYuanVLProcessor.batch_decode", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "HunYuanVLProcessor.decode", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "HunYuanVLProcessor.post_process_image_text_to_text", "n_typed": 0, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "HunYuanVLProcessor.apply_chat_template", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "HunYuanVLProcessor.get_imgs_pos", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "HunYuanVLProcessor.model_input_names", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "HunYuanVLProcessor.attributes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "HunYuanVLProcessor.valid_kwargs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "HunYuanVLProcessor.image_processor_class", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "HunYuanVLProcessor.tokenizer_class", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "HunYuanVLProcessor.tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLProcessor.image_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLProcessor.image_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLProcessor.im_start_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLProcessor.im_start_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLProcessor.im_end_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLProcessor.im_end_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLProcessor.placeholder_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLProcessor.pad_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 36, "n_typed": 4, "n_any": 0, "n_untyped": 32, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 19, "n_attrs": 13, "n_properties": 1 }, { "kind": "function", "name": "vllm.transformers_utils.processors.hunyuan_vl.split_image_into_patch_blocks", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [], "name": "vllm.transformers_utils.processors.hunyuan_vl", "names": [ "vllm.transformers_utils.processors.hunyuan_vl.HunYuanVLProcessor", "vllm.transformers_utils.processors.hunyuan_vl.split_image_into_patch_blocks" ], "n_typable": 40, "n_typed": 8, "n_any": 0, "n_untyped": 32, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 3, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 19, "n_classes": 1, "n_attrs": 13, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/processors/deepseek_vl2.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.processors.deepseek_vl2.DeepseekVLV2Processor", "methods": [ { "kind": "function", "name": "DeepseekVLV2Processor.__init__", "n_typed": 13, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 15, "n_params": 14, "n_function_overloads": 1, "n_function_params": 14 }, { "kind": "function", "name": "DeepseekVLV2Processor.select_best_resolution", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeepseekVLV2Processor.encode", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DeepseekVLV2Processor.decode", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeepseekVLV2Processor.process_one", "n_typed": 3, "n_any": 1, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "DeepseekVLV2Processor.__call__", "n_typed": 3, "n_any": 1, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "DeepseekVLV2Processor.tokenize_with_images", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [ { "kind": "property", "name": "DeepseekVLV2Processor.bos_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "DeepseekVLV2Processor.eos_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "DeepseekVLV2Processor.pad_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "DeepseekVLV2Processor.tokenizer_class", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeepseekVLV2Processor.attributes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeepseekVLV2Processor.candidate_resolutions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekVLV2Processor.image_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekVLV2Processor.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekVLV2Processor.image_mean", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekVLV2Processor.image_std", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekVLV2Processor.normalize", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekVLV2Processor.downsample_ratio", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekVLV2Processor.image_transform", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekVLV2Processor.tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekVLV2Processor.image_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekVLV2Processor.image_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekVLV2Processor.pad_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekVLV2Processor.add_special_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekVLV2Processor.sft_format", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekVLV2Processor.mask_prompt", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekVLV2Processor.ignore_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 59, "n_typed": 29, "n_any": 2, "n_untyped": 28, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 33, "n_attrs": 18, "n_properties": 3 }, { "kind": "class", "name": "vllm.transformers_utils.processors.deepseek_vl2.ImageTransform", "methods": [ { "kind": "function", "name": "ImageTransform.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ImageTransform.__call__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ImageTransform.mean", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ImageTransform.std", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ImageTransform.normalize", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ImageTransform.transform", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 4, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 4, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.transformers_utils.processors.deepseek_vl2", "names": [ "vllm.transformers_utils.processors.deepseek_vl2.DeepseekVLV2Processor", "vllm.transformers_utils.processors.deepseek_vl2.ImageTransform" ], "n_typable": 69, "n_typed": 33, "n_any": 2, "n_untyped": 34, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 37, "n_classes": 2, "n_attrs": 22, "n_properties": 3, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/processors/ovis.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.processors.ovis.OvisProcessor", "methods": [ { "kind": "function", "name": "OvisProcessor.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 7, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "OvisProcessor.__call__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "OvisProcessor._tokenize_with_image_symbol", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OvisProcessor.get_image_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "OvisProcessor.get_token_value", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OvisProcessor.construct_image_indicators", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OvisProcessor.construct_image_placeholders", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OvisProcessor.preprocess_image", "n_typed": 1, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "OvisProcessor.batch_decode", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OvisProcessor.decode", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OvisProcessor.post_process_image_text_to_text", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "OvisProcessor.extra_special_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "OvisProcessor.model_input_names", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "OvisProcessor.attributes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "OvisProcessor.valid_kwargs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "OvisProcessor.image_processor_class", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "OvisProcessor.tokenizer_class", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "OvisProcessor.image_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OvisProcessor.image_pad_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OvisProcessor.image_segment_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 39, "n_typed": 7, "n_any": 0, "n_untyped": 32, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 23, "n_attrs": 7, "n_properties": 2 } ], "type_ignores": [ { "kind": "type", "rules": [ "call-arg" ] } ], "name": "vllm.transformers_utils.processors.ovis", "names": [ "vllm.transformers_utils.processors.ovis.OvisProcessor" ], "n_typable": 39, "n_typed": 7, "n_any": 0, "n_untyped": 32, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 23, "n_classes": 1, "n_attrs": 7, "n_properties": 2, "n_type_ignores": 1 }, { "path": "vllm/transformers_utils/processors/fireredasr2_processor.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.processors.fireredasr2_processor.FireRedASR2Processor", "methods": [ { "kind": "function", "name": "FireRedASR2Processor.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "FireRedASR2Processor.get_decoder_prompt_ids", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "FireRedASR2Processor.__call__", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FireRedASR2Processor.get_prompt_ids", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FireRedASR2Processor.feature_extractor_class", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FireRedASR2Processor.tokenizer_class", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FireRedASR2Processor.current_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FireRedASR2Processor.audio_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FireRedASR2Processor.audio_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 1, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 10, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.processors.fireredasr2_processor.CMVN", "methods": [ { "kind": "function", "name": "CMVN.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "CMVN.__call__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 0, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.transformers_utils.processors.fireredasr2_processor.FireRedASR2FeatureExtractor", "methods": [ { "kind": "function", "name": "FireRedASR2FeatureExtractor.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 18, "n_overloads": 1, "n_typable": 18, "n_params": 17, "n_function_overloads": 1, "n_function_params": 17 }, { "kind": "function", "name": "FireRedASR2FeatureExtractor.__call__", "n_typed": 10, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FireRedASR2FeatureExtractor.model_input_names", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FireRedASR2FeatureExtractor.chunk_length", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FireRedASR2FeatureExtractor.max_length", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FireRedASR2FeatureExtractor.dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FireRedASR2FeatureExtractor.means", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FireRedASR2FeatureExtractor.inverse_std_variences", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FireRedASR2FeatureExtractor.num_mel_bins", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FireRedASR2FeatureExtractor.frame_length", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FireRedASR2FeatureExtractor.frame_shift", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FireRedASR2FeatureExtractor.dither", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FireRedASR2FeatureExtractor.sampling_rate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FireRedASR2FeatureExtractor.downsample_rate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FireRedASR2FeatureExtractor.context", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 41, "n_typed": 10, "n_any": 0, "n_untyped": 31, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 27, "n_attrs": 13, "n_properties": 0 }, { "kind": "attr", "name": "vllm.transformers_utils.processors.fireredasr2_processor.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.transformers_utils.processors.fireredasr2_processor.KaldifeatFbank", "methods": [ { "kind": "function", "name": "KaldifeatFbank.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "KaldifeatFbank.__call__", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "KaldifeatFbank.dither", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KaldifeatFbank.opts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 0, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.transformers_utils.processors.fireredasr2_processor", "names": [ "vllm.transformers_utils.processors.fireredasr2_processor.CMVN", "vllm.transformers_utils.processors.fireredasr2_processor.FireRedASR2FeatureExtractor", "vllm.transformers_utils.processors.fireredasr2_processor.FireRedASR2Processor", "vllm.transformers_utils.processors.fireredasr2_processor.KaldifeatFbank", "vllm.transformers_utils.processors.fireredasr2_processor.logger" ], "n_typable": 76, "n_typed": 11, "n_any": 0, "n_untyped": 65, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 48, "n_classes": 4, "n_attrs": 21, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/processors/funasr_processor.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.processors.funasr_processor.FunASRProcessor", "methods": [ { "kind": "function", "name": "FunASRProcessor.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "FunASRProcessor.get_decoder_prompt_ids", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "FunASRProcessor.__call__", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FunASRProcessor.get_prompt_ids", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FunASRProcessor.feature_extractor_class", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FunASRProcessor.tokenizer_class", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FunASRProcessor.current_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunASRProcessor.audio_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunASRProcessor.audio_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 1, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 10, "n_attrs": 5, "n_properties": 0 }, { "kind": "function", "name": "vllm.transformers_utils.processors.funasr_processor.apply_lfr", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.transformers_utils.processors.funasr_processor.apply_cmvn", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.transformers_utils.processors.funasr_processor.FunASRFeatureExtractor", "methods": [ { "kind": "function", "name": "FunASRFeatureExtractor.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 10, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "FunASRFeatureExtractor.extract_fbank", "n_typed": 1, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "FunASRFeatureExtractor.__call__", "n_typed": 12, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FunASRFeatureExtractor.model_input_names", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FunASRFeatureExtractor.frontend_conf", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunASRFeatureExtractor.n_fft", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunASRFeatureExtractor.hop_length", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunASRFeatureExtractor.chunk_length", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunASRFeatureExtractor.n_samples", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunASRFeatureExtractor.nb_max_frames", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunASRFeatureExtractor.sampling_rate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FunASRFeatureExtractor.dither", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 37, "n_typed": 13, "n_any": 0, "n_untyped": 24, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 26, "n_attrs": 9, "n_properties": 0 }, { "kind": "function", "name": "vllm.transformers_utils.processors.funasr_processor.load_cmvn", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.transformers_utils.processors.funasr_processor.WavFrontend", "methods": [ { "kind": "function", "name": "WavFrontend.__init__", "n_typed": 13, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 15, "n_params": 14, "n_function_overloads": 1, "n_function_params": 14 }, { "kind": "function", "name": "WavFrontend.output_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "WavFrontend.forward", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "WavFrontend.forward_fbank", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "WavFrontend.forward_lfr_cmvn", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "WavFrontend.fs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WavFrontend.window", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WavFrontend.n_mels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WavFrontend.frame_length", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WavFrontend.frame_shift", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WavFrontend.filter_length_min", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WavFrontend.filter_length_max", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WavFrontend.lfr_m", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WavFrontend.lfr_n", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WavFrontend.cmvn_file", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WavFrontend.dither", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WavFrontend.snip_edges", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WavFrontend.upsacle_samples", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WavFrontend.cmvn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 40, "n_typed": 22, "n_any": 0, "n_untyped": 18, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 21, "n_attrs": 14, "n_properties": 0 }, { "kind": "attr", "name": "vllm.transformers_utils.processors.funasr_processor.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.transformers_utils.processors.funasr_processor", "names": [ "vllm.transformers_utils.processors.funasr_processor.FunASRFeatureExtractor", "vllm.transformers_utils.processors.funasr_processor.FunASRProcessor", "vllm.transformers_utils.processors.funasr_processor.WavFrontend", "vllm.transformers_utils.processors.funasr_processor.apply_cmvn", "vllm.transformers_utils.processors.funasr_processor.apply_lfr", "vllm.transformers_utils.processors.funasr_processor.load_cmvn", "vllm.transformers_utils.processors.funasr_processor.logger" ], "n_typable": 104, "n_typed": 36, "n_any": 0, "n_untyped": 68, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 6, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 57, "n_classes": 3, "n_attrs": 29, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/processors/ovis2_5.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.processors.ovis2_5.Ovis2_5Processor", "methods": [ { "kind": "function", "name": "Ovis2_5Processor.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 9, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "Ovis2_5Processor.__call__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Ovis2_5Processor._tokenize_with_visual_symbol", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Ovis2_5Processor.smart_resize", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Ovis2_5Processor.get_token_value", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Ovis2_5Processor.construct_visual_indicators", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Ovis2_5Processor.construct_visual_placeholders", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Ovis2_5Processor.preprocess_multidata", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [ { "kind": "property", "name": "Ovis2_5Processor.extra_special_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "Ovis2_5Processor.attributes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Ovis2_5Processor.valid_kwargs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Ovis2_5Processor.image_processor_class", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Ovis2_5Processor.tokenizer_class", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Ovis2_5Processor.image_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ovis2_5Processor.video_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ovis2_5Processor.image_pad_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ovis2_5Processor.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ovis2_5Processor.hidden_stride", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Ovis2_5Processor.temporal_patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 44, "n_typed": 20, "n_any": 0, "n_untyped": 24, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 29, "n_attrs": 10, "n_properties": 1 } ], "type_ignores": [ { "kind": "type", "rules": [ "call-arg" ] } ], "name": "vllm.transformers_utils.processors.ovis2_5", "names": [ "vllm.transformers_utils.processors.ovis2_5.Ovis2_5Processor" ], "n_typable": 44, "n_typed": 20, "n_any": 0, "n_untyped": 24, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 29, "n_classes": 1, "n_attrs": 10, "n_properties": 1, "n_type_ignores": 1 }, { "path": "vllm/transformers_utils/processors/bagel.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.processors.bagel.BagelProcessor", "methods": [ { "kind": "function", "name": "BagelProcessor.__call__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BagelProcessor.batch_decode", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BagelProcessor.decode", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [ { "kind": "property", "name": "BagelProcessor.model_input_names", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "BagelProcessor.attributes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BagelProcessor.image_processor_class", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BagelProcessor.tokenizer_class", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 11, "n_typed": 3, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 3, "n_properties": 1 }, { "kind": "class", "name": "vllm.transformers_utils.processors.bagel.BagelProcessorKwargs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "BagelProcessorKwargs._defaults", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [ { "kind": "type", "rules": [ "call-arg" ] } ], "name": "vllm.transformers_utils.processors.bagel", "names": [ "vllm.transformers_utils.processors.bagel.BagelProcessor", "vllm.transformers_utils.processors.bagel.BagelProcessorKwargs" ], "n_typable": 11, "n_typed": 3, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_classes": 2, "n_attrs": 4, "n_properties": 1, "n_type_ignores": 1 }, { "path": "vllm/transformers_utils/processors/hunyuan_vl_image.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.processors.hunyuan_vl_image.HunYuanVLImageProcessor", "methods": [ { "kind": "function", "name": "HunYuanVLImageProcessor.__init__", "n_typed": 15, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 }, { "kind": "function", "name": "HunYuanVLImageProcessor._preprocess", "n_typed": 15, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 }, { "kind": "function", "name": "HunYuanVLImageProcessor.preprocess", "n_typed": 19, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 20, "n_params": 19, "n_function_overloads": 1, "n_function_params": 19 }, { "kind": "function", "name": "HunYuanVLImageProcessor.get_number_of_image_patches", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "HunYuanVLImageProcessor.model_input_names", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "HunYuanVLImageProcessor.min_pixels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLImageProcessor.max_pixels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLImageProcessor.size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLImageProcessor.do_resize", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLImageProcessor.resample", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLImageProcessor.do_rescale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLImageProcessor.rescale_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLImageProcessor.do_normalize", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLImageProcessor.image_mean", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLImageProcessor.image_std", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLImageProcessor.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLImageProcessor.temporal_patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLImageProcessor.merge_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "HunYuanVLImageProcessor.do_convert_rgb", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 70, "n_typed": 51, "n_any": 0, "n_untyped": 19, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 52, "n_attrs": 15, "n_properties": 0 }, { "kind": "function", "name": "vllm.transformers_utils.processors.hunyuan_vl_image.smart_resize", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "attr", "name": "vllm.transformers_utils.processors.hunyuan_vl_image.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.transformers_utils.processors.hunyuan_vl_image", "names": [ "vllm.transformers_utils.processors.hunyuan_vl_image.HunYuanVLImageProcessor", "vllm.transformers_utils.processors.hunyuan_vl_image.logger", "vllm.transformers_utils.processors.hunyuan_vl_image.smart_resize" ], "n_typable": 77, "n_typed": 56, "n_any": 0, "n_untyped": 21, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 5, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 52, "n_classes": 1, "n_attrs": 16, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/processors/deepseek_ocr.py", "symbol_reports": [ { "kind": "function", "name": "vllm.transformers_utils.processors.deepseek_ocr.find_closest_aspect_ratio", "n_typed": 0, "n_any": 0, "n_untyped": 6, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.transformers_utils.processors.deepseek_ocr.calculate_aspect_ratios", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.transformers_utils.processors.deepseek_ocr.BASE_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.transformers_utils.processors.deepseek_ocr.MAX_CROPS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.transformers_utils.processors.deepseek_ocr.CROP_MODE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.transformers_utils.processors.deepseek_ocr.ImageTransform", "methods": [ { "kind": "function", "name": "ImageTransform.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ImageTransform.__call__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ImageTransform.mean", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ImageTransform.std", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ImageTransform.normalize", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ImageTransform.transform", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 4, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 4, "n_properties": 0 }, { "kind": "function", "name": "vllm.transformers_utils.processors.deepseek_ocr.count_tiles", "n_typed": 0, "n_any": 0, "n_untyped": 7, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.transformers_utils.processors.deepseek_ocr.dynamic_preprocess", "n_typed": 0, "n_any": 0, "n_untyped": 6, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "class", "name": "vllm.transformers_utils.processors.deepseek_ocr.DeepseekOCRProcessor", "methods": [ { "kind": "function", "name": "DeepseekOCRProcessor.__init__", "n_typed": 15, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 17, "n_params": 16, "n_function_overloads": 1, "n_function_params": 16 }, { "kind": "function", "name": "DeepseekOCRProcessor.encode", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DeepseekOCRProcessor.decode", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeepseekOCRProcessor.process_one", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DeepseekOCRProcessor.__call__", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "DeepseekOCRProcessor.tokenize_with_images", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [ { "kind": "property", "name": "DeepseekOCRProcessor.bos_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "DeepseekOCRProcessor.eos_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "property", "name": "DeepseekOCRProcessor.pad_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "DeepseekOCRProcessor.tokenizer_class", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeepseekOCRProcessor.attributes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeepseekOCRProcessor.image_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCRProcessor.base_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCRProcessor.strategy", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCRProcessor.patch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCRProcessor.image_mean", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCRProcessor.image_std", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCRProcessor.normalize", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCRProcessor.downsample_ratio", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCRProcessor.image_transform", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCRProcessor.tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCRProcessor.image_token_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCRProcessor.image_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCRProcessor.pad_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCRProcessor.add_special_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCRProcessor.sft_format", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCRProcessor.mask_prompt", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekOCRProcessor.ignore_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 59, "n_typed": 31, "n_any": 0, "n_untyped": 28, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 33, "n_attrs": 19, "n_properties": 3 }, { "kind": "attr", "name": "vllm.transformers_utils.processors.deepseek_ocr.MIN_CROPS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.transformers_utils.processors.deepseek_ocr.IMAGE_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.transformers_utils.processors.deepseek_ocr", "names": [ "vllm.transformers_utils.processors.deepseek_ocr.BASE_SIZE", "vllm.transformers_utils.processors.deepseek_ocr.CROP_MODE", "vllm.transformers_utils.processors.deepseek_ocr.DeepseekOCRProcessor", "vllm.transformers_utils.processors.deepseek_ocr.IMAGE_SIZE", "vllm.transformers_utils.processors.deepseek_ocr.ImageTransform", "vllm.transformers_utils.processors.deepseek_ocr.MAX_CROPS", "vllm.transformers_utils.processors.deepseek_ocr.MIN_CROPS", "vllm.transformers_utils.processors.deepseek_ocr.calculate_aspect_ratios", "vllm.transformers_utils.processors.deepseek_ocr.count_tiles", "vllm.transformers_utils.processors.deepseek_ocr.dynamic_preprocess", "vllm.transformers_utils.processors.deepseek_ocr.find_closest_aspect_ratio" ], "n_typable": 91, "n_typed": 38, "n_any": 0, "n_untyped": 53, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 18, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 37, "n_classes": 2, "n_attrs": 28, "n_properties": 3, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/processors/qwen3_asr.py", "symbol_reports": [ { "kind": "class", "name": "vllm.transformers_utils.processors.qwen3_asr.Qwen3ASRProcessor", "methods": [ { "kind": "function", "name": "Qwen3ASRProcessor.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Qwen3ASRProcessor.__call__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Qwen3ASRProcessor.replace_multimodal_special_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3ASRProcessor.get_chunked_index", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Qwen3ASRProcessor.apply_chat_template", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [ { "kind": "property", "name": "Qwen3ASRProcessor.model_input_names", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "Qwen3ASRProcessor.attributes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3ASRProcessor.feature_extractor_class", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3ASRProcessor.tokenizer_class", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Qwen3ASRProcessor.audio_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3ASRProcessor.audio_bos_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Qwen3ASRProcessor.audio_eos_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 6, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 13, "n_attrs": 6, "n_properties": 1 }, { "kind": "class", "name": "vllm.transformers_utils.processors.qwen3_asr.Qwen3ASRProcessorKwargs", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Qwen3ASRProcessorKwargs._defaults", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.transformers_utils.processors.qwen3_asr", "names": [ "vllm.transformers_utils.processors.qwen3_asr.Qwen3ASRProcessor", "vllm.transformers_utils.processors.qwen3_asr.Qwen3ASRProcessorKwargs" ], "n_typable": 22, "n_typed": 6, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 13, "n_classes": 2, "n_attrs": 7, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/repo_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.transformers_utils.repo_utils.get_hf_file_bytes", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.transformers_utils.repo_utils.file_exists", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.transformers_utils.repo_utils.list_repo_files", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.transformers_utils.repo_utils.file_or_path_exists", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.transformers_utils.repo_utils.list_filtered_repo_files", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.transformers_utils.repo_utils.is_mistral_model_repo", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.transformers_utils.repo_utils.try_get_local_file", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.transformers_utils.repo_utils.any_pattern_in_repo_files", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.transformers_utils.repo_utils.with_retry", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "attr", "name": "vllm.transformers_utils.repo_utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.transformers_utils.repo_utils.get_model_path", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.transformers_utils.repo_utils.get_hf_file_to_dict", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [], "name": "vllm.transformers_utils.repo_utils", "names": [ "vllm.transformers_utils.repo_utils.any_pattern_in_repo_files", "vllm.transformers_utils.repo_utils.file_exists", "vllm.transformers_utils.repo_utils.file_or_path_exists", "vllm.transformers_utils.repo_utils.get_hf_file_bytes", "vllm.transformers_utils.repo_utils.get_hf_file_to_dict", "vllm.transformers_utils.repo_utils.get_model_path", "vllm.transformers_utils.repo_utils.is_mistral_model_repo", "vllm.transformers_utils.repo_utils.list_filtered_repo_files", "vllm.transformers_utils.repo_utils.list_repo_files", "vllm.transformers_utils.repo_utils.logger", "vllm.transformers_utils.repo_utils.try_get_local_file", "vllm.transformers_utils.repo_utils.with_retry" ], "n_typable": 53, "n_typed": 49, "n_any": 0, "n_untyped": 4, "n_functions": 11, "n_function_overloads": 11, "n_function_params": 41, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/transformers_utils/runai_utils.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.transformers_utils.runai_utils.SUPPORTED_SCHEMES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.transformers_utils.runai_utils.runai_pull_files", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.transformers_utils.runai_utils.list_safetensors", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.runai_utils.runai_model_streamer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.transformers_utils.runai_utils.is_runai_obj_uri", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.runai_utils.runai_list_safetensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.runai_utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.transformers_utils.runai_utils.ObjectStorageModel", "methods": [ { "kind": "function", "name": "ObjectStorageModel.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ObjectStorageModel._close", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ObjectStorageModel._close_by_signal", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ObjectStorageModel.pull_files", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ObjectStorageModel.dir", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 7, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 5, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [ { "kind": "type", "rules": [ "assignment" ] } ], "name": "vllm.transformers_utils.runai_utils", "names": [ "vllm.transformers_utils.runai_utils.ObjectStorageModel", "vllm.transformers_utils.runai_utils.SUPPORTED_SCHEMES", "vllm.transformers_utils.runai_utils.is_runai_obj_uri", "vllm.transformers_utils.runai_utils.list_safetensors", "vllm.transformers_utils.runai_utils.logger", "vllm.transformers_utils.runai_utils.runai_list_safetensors", "vllm.transformers_utils.runai_utils.runai_model_streamer", "vllm.transformers_utils.runai_utils.runai_pull_files" ], "n_typable": 18, "n_typed": 11, "n_any": 0, "n_untyped": 7, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 2, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 5, "n_classes": 1, "n_attrs": 6, "n_properties": 0, "n_type_ignores": 1 }, { "path": "vllm/transformers_utils/s3_utils.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.transformers_utils.s3_utils.boto3", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.transformers_utils.s3_utils.list_files", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.transformers_utils.s3_utils.glob", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [ { "kind": "type", "rules": [ "assignment" ] } ], "name": "vllm.transformers_utils.s3_utils", "names": [ "vllm.transformers_utils.s3_utils.boto3", "vllm.transformers_utils.s3_utils.glob", "vllm.transformers_utils.s3_utils.list_files" ], "n_typable": 10, "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 7, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 1 }, { "path": "vllm/transformers_utils/utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.transformers_utils.utils.is_gcs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.transformers_utils.utils.maybe_model_redirect", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.transformers_utils.utils.is_s3", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.transformers_utils.utils.convert_model_repo_to_path", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.transformers_utils.utils.modelscope_list_repo_files", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.transformers_utils.utils.parse_safetensors_file_metadata", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.transformers_utils.utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.transformers_utils.utils.is_cloud_storage", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.transformers_utils.utils", "names": [ "vllm.transformers_utils.utils.convert_model_repo_to_path", "vllm.transformers_utils.utils.is_cloud_storage", "vllm.transformers_utils.utils.is_gcs", "vllm.transformers_utils.utils.is_s3", "vllm.transformers_utils.utils.logger", "vllm.transformers_utils.utils.maybe_model_redirect", "vllm.transformers_utils.utils.modelscope_list_repo_files", "vllm.transformers_utils.utils.parse_safetensors_file_metadata" ], "n_typable": 17, "n_typed": 16, "n_any": 0, "n_untyped": 1, "n_functions": 7, "n_function_overloads": 7, "n_function_params": 9, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/triton_utils/__init__.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.triton_utils.tldevice", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.triton_utils.tl", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.triton_utils.triton", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.triton_utils", "names": [ "vllm.triton_utils.tl", "vllm.triton_utils.tldevice", "vllm.triton_utils.triton" ], "n_typable": 3, "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/triton_utils/importing.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.triton_utils.importing.HAS_TRITON", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.triton_utils.importing.active_drivers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.triton_utils.importing.TritonPlaceholder", "methods": [ { "kind": "function", "name": "TritonPlaceholder.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TritonPlaceholder._dummy_decorator", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TritonPlaceholder.jit", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TritonPlaceholder.autotune", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TritonPlaceholder.heuristics", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TritonPlaceholder.Config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TritonPlaceholder.language", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 0, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.triton_utils.importing.TritonLanguagePlaceholder", "methods": [ { "kind": "function", "name": "TritonLanguagePlaceholder.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TritonLanguagePlaceholder.constexpr", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TritonLanguagePlaceholder.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TritonLanguagePlaceholder.int64", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TritonLanguagePlaceholder.int32", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TritonLanguagePlaceholder.tensor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TritonLanguagePlaceholder.exp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TritonLanguagePlaceholder.log", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TritonLanguagePlaceholder.log2", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 0, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 8, "n_properties": 0 }, { "kind": "attr", "name": "vllm.triton_utils.importing.cuda_visible_devices", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.triton_utils.importing.is_distributed_env", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.triton_utils.importing.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.triton_utils.importing", "names": [ "vllm.triton_utils.importing.HAS_TRITON", "vllm.triton_utils.importing.TritonLanguagePlaceholder", "vllm.triton_utils.importing.TritonPlaceholder", "vllm.triton_utils.importing.active_drivers", "vllm.triton_utils.importing.cuda_visible_devices", "vllm.triton_utils.importing.is_distributed_env", "vllm.triton_utils.importing.logger" ], "n_typable": 22, "n_typed": 0, "n_any": 0, "n_untyped": 22, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 1, "n_classes": 2, "n_attrs": 18, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/triton_utils/allocation.py", "symbol_reports": [ { "kind": "function", "name": "vllm.triton_utils.allocation.set_triton_allocator", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.triton_utils.allocation", "names": [ "vllm.triton_utils.allocation.set_triton_allocator" ], "n_typable": 2, "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/usage/usage_lib.py", "symbol_reports": [ { "kind": "function", "name": "vllm.usage.usage_lib.set_runtime_usage_data", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.usage.usage_lib.UsageMessage", "methods": [ { "kind": "function", "name": "UsageMessage.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "UsageMessage.report_usage", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "UsageMessage._report_usage_worker", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "UsageMessage._report_tpu_inference_usage", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "UsageMessage._report_usage_once", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "UsageMessage._report_continuous_usage", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "UsageMessage._send_to_server", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "UsageMessage._write_to_file", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "UsageMessage.uuid", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UsageMessage.provider", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "UsageMessage.num_cpu", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "UsageMessage.cpu_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "UsageMessage.cpu_family_model_stepping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "UsageMessage.total_memory", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "UsageMessage.architecture", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "UsageMessage.platform", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "UsageMessage.cuda_runtime", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "UsageMessage.gpu_count", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "UsageMessage.gpu_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "UsageMessage.gpu_memory_per_device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "UsageMessage.env_var_json", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "UsageMessage.model_architecture", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "UsageMessage.vllm_version", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "UsageMessage.context", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "UsageMessage.log_time", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "UsageMessage.source", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 37, "n_typed": 35, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 11, "n_attrs": 18, "n_properties": 0 }, { "kind": "class", "name": "vllm.usage.usage_lib.UsageContext", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "UsageContext.UNKNOWN_CONTEXT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "UsageContext.LLM_CLASS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "UsageContext.API_SERVER", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "UsageContext.OPENAI_API_SERVER", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "UsageContext.OPENAI_BATCH_RUNNER", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "UsageContext.ENGINE_CONTEXT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 6, "n_properties": 0 }, { "kind": "function", "name": "vllm.usage.usage_lib.is_usage_stats_enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.usage.usage_lib.usage_message", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.usage.usage_lib.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.usage.usage_lib", "names": [ "vllm.usage.usage_lib.UsageContext", "vllm.usage.usage_lib.UsageMessage", "vllm.usage.usage_lib.is_usage_stats_enabled", "vllm.usage.usage_lib.logger", "vllm.usage.usage_lib.set_runtime_usage_data", "vllm.usage.usage_lib.usage_message" ], "n_typable": 43, "n_typed": 38, "n_any": 0, "n_untyped": 5, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 2, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 11, "n_classes": 2, "n_attrs": 26, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/utils/__init__.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.utils.MASK_64_BITS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.utils.random_uuid", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.utils.length_from_prompt_token_ids_or_embeds", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.utils", "names": [ "vllm.utils.MASK_64_BITS", "vllm.utils.length_from_prompt_token_ids_or_embeds", "vllm.utils.random_uuid" ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 2, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/utils/argparse_utils.py", "symbol_reports": [ { "kind": "class", "name": "vllm.utils.argparse_utils.SortedHelpFormatter", "methods": [ { "kind": "function", "name": "SortedHelpFormatter._split_lines", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SortedHelpFormatter.add_arguments", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 5, "n_typed": 0, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.utils.argparse_utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.utils.argparse_utils.FlexibleArgumentParser", "methods": [ { "kind": "function", "name": "FlexibleArgumentParser.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FlexibleArgumentParser.format_help", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlexibleArgumentParser.parse_args", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FlexibleArgumentParser.check_port", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlexibleArgumentParser._pull_args_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlexibleArgumentParser.load_config_file", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlexibleArgumentParser._deprecated", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlexibleArgumentParser._json_tip", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlexibleArgumentParser._search_keyword", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlexibleArgumentParser.add_json_tip", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 9, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 7, "n_attrs": 4, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.utils.argparse_utils", "names": [ "vllm.utils.argparse_utils.FlexibleArgumentParser", "vllm.utils.argparse_utils.SortedHelpFormatter", "vllm.utils.argparse_utils.logger" ], "n_typable": 23, "n_typed": 9, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 10, "n_classes": 2, "n_attrs": 5, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/utils/async_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.utils.async_utils.make_async", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.utils.async_utils.merge_async_iterators", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.utils.async_utils.P", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.utils.async_utils.in_loop", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.utils.async_utils.AsyncMicrobatchTokenizer", "methods": [ { "kind": "function", "name": "AsyncMicrobatchTokenizer.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "AsyncMicrobatchTokenizer.__call__", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AsyncMicrobatchTokenizer.encode", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AsyncMicrobatchTokenizer.decode", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AsyncMicrobatchTokenizer._get_queue", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AsyncMicrobatchTokenizer._batch_encode_loop", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AsyncMicrobatchTokenizer._batch_decode_loop", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AsyncMicrobatchTokenizer._queue_key", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AsyncMicrobatchTokenizer.__del__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AsyncMicrobatchTokenizer.tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AsyncMicrobatchTokenizer.max_batch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AsyncMicrobatchTokenizer.batch_wait_timeout_s", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 28, "n_typed": 15, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 16, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.utils.async_utils.T", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.utils.async_utils.cancel_task_threadsafe", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.utils.async_utils.run_in_loop", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.utils.async_utils.anext", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.utils.async_utils.collect_from_async_generator", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.utils.async_utils", "names": [ "vllm.utils.async_utils.AsyncMicrobatchTokenizer", "vllm.utils.async_utils.P", "vllm.utils.async_utils.T", "vllm.utils.async_utils.anext", "vllm.utils.async_utils.cancel_task_threadsafe", "vllm.utils.async_utils.collect_from_async_generator", "vllm.utils.async_utils.in_loop", "vllm.utils.async_utils.make_async", "vllm.utils.async_utils.merge_async_iterators", "vllm.utils.async_utils.run_in_loop" ], "n_typable": 45, "n_typed": 28, "n_any": 0, "n_untyped": 17, "n_functions": 7, "n_function_overloads": 7, "n_function_params": 10, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 16, "n_classes": 1, "n_attrs": 5, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/utils/cache.py", "symbol_reports": [ { "kind": "class", "name": "vllm.utils.cache.LRUCache", "methods": [ { "kind": "function", "name": "LRUCache.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LRUCache.__getitem__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LRUCache.__delitem__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LRUCache.stat", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LRUCache.touch", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LRUCache.get", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 3, "n_params": 2, "n_function_overloads": 2, "n_function_params": 2 }, { "kind": "function", "name": "LRUCache.pop", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 3, "n_params": 2, "n_function_overloads": 2, "n_function_params": 2 }, { "kind": "function", "name": "LRUCache.put", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LRUCache.pin", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LRUCache._unpin", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LRUCache._on_remove", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LRUCache.remove_oldest", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LRUCache._remove_old_if_needed", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LRUCache.popitem", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LRUCache.clear", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "LRUCache.cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "LRUCache.order", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "LRUCache.capacity", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "LRUCache.usage", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "LRUCache.pinned_items", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 39, "n_typed": 36, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 17, "n_method_params": 19, "n_attrs": 1, "n_properties": 4 }, { "kind": "attr", "name": "vllm.utils.cache.ALL_PINNED_SENTINEL", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.utils.cache.CacheInfo", "methods": [ { "kind": "function", "name": "CacheInfo.__sub__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "CacheInfo.hit_ratio", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "CacheInfo.hits", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CacheInfo.total", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 2, "n_properties": 1 } ], "type_ignores": [], "name": "vllm.utils.cache", "names": [ "vllm.utils.cache.ALL_PINNED_SENTINEL", "vllm.utils.cache.CacheInfo", "vllm.utils.cache.LRUCache" ], "n_typable": 43, "n_typed": 38, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 16, "n_method_overloads": 18, "n_method_params": 20, "n_classes": 2, "n_attrs": 4, "n_properties": 5, "n_type_ignores": 0 }, { "path": "vllm/utils/collection_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.utils.collection_utils.as_list", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.utils.collection_utils.chunk_list", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.utils.collection_utils.is_list_of", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.utils.collection_utils.LazyDict", "methods": [ { "kind": "function", "name": "LazyDict.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LazyDict.__getitem__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LazyDict.__setitem__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LazyDict.__iter__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LazyDict.__len__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 5, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.utils.collection_utils.flatten_2d_lists", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.utils.collection_utils.swap_dict_values", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.utils.collection_utils.T", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.utils.collection_utils.common_prefix", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 2, "n_params": 1, "n_function_overloads": 2, "n_function_params": 1 }, { "kind": "function", "name": "vllm.utils.collection_utils.full_groupby", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.utils.collection_utils", "names": [ "vllm.utils.collection_utils.LazyDict", "vllm.utils.collection_utils.T", "vllm.utils.collection_utils.as_list", "vllm.utils.collection_utils.chunk_list", "vllm.utils.collection_utils.common_prefix", "vllm.utils.collection_utils.flatten_2d_lists", "vllm.utils.collection_utils.full_groupby", "vllm.utils.collection_utils.is_list_of", "vllm.utils.collection_utils.swap_dict_values" ], "n_typable": 29, "n_typed": 24, "n_any": 0, "n_untyped": 5, "n_functions": 7, "n_function_overloads": 8, "n_function_params": 13, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 4, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/utils/counter.py", "symbol_reports": [ { "kind": "class", "name": "vllm.utils.counter.Counter", "methods": [ { "kind": "function", "name": "Counter.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Counter.__next__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Counter.reset", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Counter.counter", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 5, "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 1, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.utils.counter.AtomicCounter", "methods": [ { "kind": "function", "name": "AtomicCounter.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AtomicCounter.inc", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AtomicCounter.dec", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "AtomicCounter.value", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_attrs": 0, "n_properties": 1 } ], "type_ignores": [], "name": "vllm.utils.counter", "names": [ "vllm.utils.counter.AtomicCounter", "vllm.utils.counter.Counter" ], "n_typable": 12, "n_typed": 11, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 4, "n_classes": 2, "n_attrs": 1, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/utils/deep_gemm.py", "symbol_reports": [ { "kind": "function", "name": "vllm.utils.deep_gemm.per_block_cast_to_fp8", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.utils.deep_gemm.fp8_paged_mqa_logits_torch", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.utils.deep_gemm.m_grouped_fp8_gemm_nt_contiguous", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.utils.deep_gemm.DeepGemmQuantScaleFMT", "methods": [ { "kind": "function", "name": "DeepGemmQuantScaleFMT.init_oracle_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeepGemmQuantScaleFMT.from_oracle", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DeepGemmQuantScaleFMT.FLOAT32", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeepGemmQuantScaleFMT.FLOAT32_CEIL_UE8M0", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeepGemmQuantScaleFMT.UE8M0", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "function", "name": "vllm.utils.deep_gemm.fp8_gemm_nt", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.utils.deep_gemm.fp8_paged_mqa_logits", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "vllm.utils.deep_gemm.get_mk_alignment_for_contiguous_layout", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.utils.deep_gemm.get_col_major_tma_aligned_tensor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.utils.deep_gemm.calc_diff", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.utils.deep_gemm.fp8_mqa_logits_torch", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.utils.deep_gemm.is_deep_gemm_e8m0_used", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.utils.deep_gemm.fp8_mqa_logits", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.utils.deep_gemm.should_use_deepgemm_for_fp8_linear", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.utils.deep_gemm.get_paged_mqa_logits_metadata", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.utils.deep_gemm.is_deep_gemm_supported", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.utils.deep_gemm.get_num_sms", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.utils.deep_gemm.fp8_m_grouped_gemm_nt_masked", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.utils.deep_gemm", "names": [ "vllm.utils.deep_gemm.DeepGemmQuantScaleFMT", "vllm.utils.deep_gemm.calc_diff", "vllm.utils.deep_gemm.fp8_gemm_nt", "vllm.utils.deep_gemm.fp8_m_grouped_gemm_nt_masked", "vllm.utils.deep_gemm.fp8_mqa_logits", "vllm.utils.deep_gemm.fp8_mqa_logits_torch", "vllm.utils.deep_gemm.fp8_paged_mqa_logits", "vllm.utils.deep_gemm.fp8_paged_mqa_logits_torch", "vllm.utils.deep_gemm.get_col_major_tma_aligned_tensor", "vllm.utils.deep_gemm.get_mk_alignment_for_contiguous_layout", "vllm.utils.deep_gemm.get_num_sms", "vllm.utils.deep_gemm.get_paged_mqa_logits_metadata", "vllm.utils.deep_gemm.is_deep_gemm_e8m0_used", "vllm.utils.deep_gemm.is_deep_gemm_supported", "vllm.utils.deep_gemm.m_grouped_fp8_gemm_nt_contiguous", "vllm.utils.deep_gemm.per_block_cast_to_fp8", "vllm.utils.deep_gemm.should_use_deepgemm_for_fp8_linear" ], "n_typable": 61, "n_typed": 50, "n_any": 0, "n_untyped": 11, "n_functions": 16, "n_function_overloads": 16, "n_function_params": 43, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 0, "n_classes": 1, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/utils/flashinfer.py", "symbol_reports": [ { "kind": "function", "name": "vllm.utils.flashinfer.has_flashinfer_comm", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.utils.flashinfer.use_trtllm_attention", "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "vllm.utils.flashinfer.flashinfer_scaled_fp4_mm", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "attr", "name": "vllm.utils.flashinfer.flashinfer_fp4_quantize", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.utils.flashinfer.flashinfer_cutlass_fused_moe", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.utils.flashinfer.scaled_fp4_grouped_quantize", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.utils.flashinfer.silu_and_mul_scaled_nvfp4_experts_quantize", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.utils.flashinfer.has_flashinfer_fp8_blockscale_gemm", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.utils.flashinfer.flashinfer_cutedsl_grouped_gemm_nt_masked", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.utils.flashinfer.can_use_trtllm_attention", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.utils.flashinfer.has_flashinfer_cutedsl_grouped_gemm_nt_masked", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.utils.flashinfer.is_flashinfer_fp8_blockscale_gemm_supported", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.utils.flashinfer.flashinfer_scaled_fp8_mm", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.utils.flashinfer.flashinfer_quant_nvfp4_8x4_sf_layout", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.utils.flashinfer.should_use_flashinfer_for_blockscale_fp8_gemm", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.utils.flashinfer.has_nvidia_artifactory", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.utils.flashinfer.has_flashinfer_moe", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.utils.flashinfer.flashinfer_fp8_blockscale_gemm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.utils.flashinfer.trtllm_fp4_block_scale_moe", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.utils.flashinfer.flashinfer_trtllm_fp8_block_scale_moe", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.utils.flashinfer.has_flashinfer_cutlass_fused_moe", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.utils.flashinfer.nvfp4_block_scale_interleave", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.utils.flashinfer.has_flashinfer_all2all", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.utils.flashinfer.has_flashinfer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.utils.flashinfer.autotune", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.utils.flashinfer.supports_trtllm_attention", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "type_ignores": [], "name": "vllm.utils.flashinfer", "names": [ "vllm.utils.flashinfer.autotune", "vllm.utils.flashinfer.can_use_trtllm_attention", "vllm.utils.flashinfer.flashinfer_cutedsl_grouped_gemm_nt_masked", "vllm.utils.flashinfer.flashinfer_cutlass_fused_moe", "vllm.utils.flashinfer.flashinfer_fp4_quantize", "vllm.utils.flashinfer.flashinfer_fp8_blockscale_gemm", "vllm.utils.flashinfer.flashinfer_quant_nvfp4_8x4_sf_layout", "vllm.utils.flashinfer.flashinfer_scaled_fp4_mm", "vllm.utils.flashinfer.flashinfer_scaled_fp8_mm", "vllm.utils.flashinfer.flashinfer_trtllm_fp8_block_scale_moe", "vllm.utils.flashinfer.has_flashinfer", "vllm.utils.flashinfer.has_flashinfer_all2all", "vllm.utils.flashinfer.has_flashinfer_comm", "vllm.utils.flashinfer.has_flashinfer_cutedsl_grouped_gemm_nt_masked", "vllm.utils.flashinfer.has_flashinfer_cutlass_fused_moe", "vllm.utils.flashinfer.has_flashinfer_fp8_blockscale_gemm", "vllm.utils.flashinfer.has_flashinfer_moe", "vllm.utils.flashinfer.has_nvidia_artifactory", "vllm.utils.flashinfer.is_flashinfer_fp8_blockscale_gemm_supported", "vllm.utils.flashinfer.nvfp4_block_scale_interleave", "vllm.utils.flashinfer.scaled_fp4_grouped_quantize", "vllm.utils.flashinfer.should_use_flashinfer_for_blockscale_fp8_gemm", "vllm.utils.flashinfer.silu_and_mul_scaled_nvfp4_experts_quantize", "vllm.utils.flashinfer.supports_trtllm_attention", "vllm.utils.flashinfer.trtllm_fp4_block_scale_moe", "vllm.utils.flashinfer.use_trtllm_attention" ], "n_typable": 58, "n_typed": 47, "n_any": 0, "n_untyped": 11, "n_functions": 16, "n_function_overloads": 16, "n_function_params": 32, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 10, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/utils/func_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.utils.func_utils.get_allowed_kwarg_only_overrides", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.utils.func_utils.supports_kw", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "attr", "name": "vllm.utils.func_utils.P", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.utils.func_utils.deprecate_args", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.utils.func_utils.identity", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.utils.func_utils.run_once", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.utils.func_utils.F", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.utils.func_utils.T", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.utils.func_utils.deprecate_kwargs", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.utils.func_utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.utils.func_utils", "names": [ "vllm.utils.func_utils.F", "vllm.utils.func_utils.P", "vllm.utils.func_utils.T", "vllm.utils.func_utils.deprecate_args", "vllm.utils.func_utils.deprecate_kwargs", "vllm.utils.func_utils.get_allowed_kwarg_only_overrides", "vllm.utils.func_utils.identity", "vllm.utils.func_utils.logger", "vllm.utils.func_utils.run_once", "vllm.utils.func_utils.supports_kw" ], "n_typable": 24, "n_typed": 22, "n_any": 0, "n_untyped": 2, "n_functions": 6, "n_function_overloads": 6, "n_function_params": 17, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/utils/gc_utils.py", "symbol_reports": [ { "kind": "class", "name": "vllm.utils.gc_utils.GCDebugConfig", "methods": [ { "kind": "function", "name": "GCDebugConfig.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GCDebugConfig.__repr__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GCDebugConfig.enabled", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GCDebugConfig.top_objects", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.utils.gc_utils.GCDebugger", "methods": [ { "kind": "function", "name": "GCDebugger.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GCDebugger.handle", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GCDebugger.config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GCDebugger.start_time_ns", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GCDebugger.num_objects", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GCDebugger.gc_top_collected_objects", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 9, "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 4, "n_properties": 0 }, { "kind": "function", "name": "vllm.utils.gc_utils.maybe_attach_gc_debug_callback", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.utils.gc_utils.freeze_gc_heap", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.utils.gc_utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.utils.gc_utils", "names": [ "vllm.utils.gc_utils.GCDebugConfig", "vllm.utils.gc_utils.GCDebugger", "vllm.utils.gc_utils.freeze_gc_heap", "vllm.utils.gc_utils.logger", "vllm.utils.gc_utils.maybe_attach_gc_debug_callback" ], "n_typable": 17, "n_typed": 15, "n_any": 0, "n_untyped": 2, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 4, "n_classes": 2, "n_attrs": 7, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/utils/hashing.py", "symbol_reports": [ { "kind": "function", "name": "vllm.utils.hashing.get_hash_fn_by_name", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.utils.hashing.xxhash", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.utils.hashing.safe_hash", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.utils.hashing.xxhash_cbor", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.utils.hashing.sha256_cbor", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.utils.hashing.sha256", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.utils.hashing", "names": [ "vllm.utils.hashing.get_hash_fn_by_name", "vllm.utils.hashing.safe_hash", "vllm.utils.hashing.sha256", "vllm.utils.hashing.sha256_cbor", "vllm.utils.hashing.xxhash", "vllm.utils.hashing.xxhash_cbor" ], "n_typable": 13, "n_typed": 9, "n_any": 4, "n_untyped": 0, "n_functions": 6, "n_function_overloads": 6, "n_function_params": 7, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/utils/import_utils.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.utils.import_utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.utils.import_utils.has_deep_gemm", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "class", "name": "vllm.utils.import_utils.PlaceholderModule", "methods": [ { "kind": "function", "name": "PlaceholderModule.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PlaceholderModule.placeholder_attr", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PlaceholderModule.__getattr__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.utils.import_utils.import_from_path", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.utils.import_utils.has_aiter", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.utils.import_utils.import_pynvml", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.utils.import_utils.has_mori", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.utils.import_utils.import_triton_kernels", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.utils.import_utils.has_deep_ep", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.utils.import_utils.has_triton_kernels", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.utils.import_utils.has_tilelang", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.utils.import_utils.has_arctic_inference", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "class", "name": "vllm.utils.import_utils.LazyLoader", "methods": [ { "kind": "function", "name": "LazyLoader.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LazyLoader._load", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LazyLoader.__getattr__", "n_typed": 0, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LazyLoader.__dir__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 8, "n_typed": 5, "n_any": 2, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.utils.import_utils.resolve_obj_by_qualname", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.utils.import_utils.has_helion", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.utils.import_utils.get_vllm_optional_dependencies", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "type_ignores": [], "name": "vllm.utils.import_utils", "names": [ "vllm.utils.import_utils.LazyLoader", "vllm.utils.import_utils.PlaceholderModule", "vllm.utils.import_utils.get_vllm_optional_dependencies", "vllm.utils.import_utils.has_aiter", "vllm.utils.import_utils.has_arctic_inference", "vllm.utils.import_utils.has_deep_ep", "vllm.utils.import_utils.has_deep_gemm", "vllm.utils.import_utils.has_helion", "vllm.utils.import_utils.has_mori", "vllm.utils.import_utils.has_tilelang", "vllm.utils.import_utils.has_triton_kernels", "vllm.utils.import_utils.import_from_path", "vllm.utils.import_utils.import_pynvml", "vllm.utils.import_utils.import_triton_kernels", "vllm.utils.import_utils.logger", "vllm.utils.import_utils.resolve_obj_by_qualname" ], "n_typable": 31, "n_typed": 21, "n_any": 3, "n_untyped": 7, "n_functions": 13, "n_function_overloads": 13, "n_function_params": 3, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 7, "n_classes": 2, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/utils/jsontree.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.utils.jsontree.JSONTree", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.utils.jsontree.json_map_leaves", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 5, "n_typable": 3, "n_params": 2, "n_function_overloads": 5, "n_function_params": 2 }, { "kind": "function", "name": "vllm.utils.jsontree.json_reduce_leaves", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 5, "n_typable": 4, "n_params": 3, "n_function_overloads": 5, "n_function_params": 3 }, { "kind": "function", "name": "vllm.utils.jsontree.json_iter_leaves", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.utils.jsontree.json_count_leaves", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.utils.jsontree", "names": [ "vllm.utils.jsontree.JSONTree", "vllm.utils.jsontree.json_count_leaves", "vllm.utils.jsontree.json_iter_leaves", "vllm.utils.jsontree.json_map_leaves", "vllm.utils.jsontree.json_reduce_leaves" ], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 4, "n_function_overloads": 12, "n_function_params": 7, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/utils/math_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.utils.math_utils.round_down", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.utils.math_utils.largest_power_of_2_divisor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.utils.math_utils.next_power_of_2", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.utils.math_utils.prev_power_of_2", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.utils.math_utils.round_up", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.utils.math_utils.RCP_LN2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.utils.math_utils.cdiv", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.utils.math_utils", "names": [ "vllm.utils.math_utils.RCP_LN2", "vllm.utils.math_utils.cdiv", "vllm.utils.math_utils.largest_power_of_2_divisor", "vllm.utils.math_utils.next_power_of_2", "vllm.utils.math_utils.prev_power_of_2", "vllm.utils.math_utils.round_down", "vllm.utils.math_utils.round_up" ], "n_typable": 15, "n_typed": 15, "n_any": 0, "n_untyped": 0, "n_functions": 6, "n_function_overloads": 6, "n_function_params": 9, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/utils/mem_constants.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.utils.mem_constants.GB_bytes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.utils.mem_constants.MB_bytes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.utils.mem_constants.GiB_bytes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.utils.mem_constants.MiB_bytes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.utils.mem_constants", "names": [ "vllm.utils.mem_constants.GB_bytes", "vllm.utils.mem_constants.GiB_bytes", "vllm.utils.mem_constants.MB_bytes", "vllm.utils.mem_constants.MiB_bytes" ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/utils/mem_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.utils.mem_utils.format_gib", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.utils.mem_utils.get_cpu_memory", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "class", "name": "vllm.utils.mem_utils.MemorySnapshot", "methods": [ { "kind": "function", "name": "MemorySnapshot.__post_init__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MemorySnapshot.measure", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MemorySnapshot.__sub__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MemorySnapshot.__repr__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MemorySnapshot.torch_peak", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MemorySnapshot.free_memory", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MemorySnapshot.total_memory", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MemorySnapshot.cuda_memory", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MemorySnapshot.torch_memory", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MemorySnapshot.non_torch_memory", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MemorySnapshot.timestamp", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MemorySnapshot.device", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MemorySnapshot.auto_measure", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 1, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.utils.mem_utils.DeviceMemoryProfiler", "methods": [ { "kind": "function", "name": "DeviceMemoryProfiler.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DeviceMemoryProfiler.current_memory_usage", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeviceMemoryProfiler.__enter__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeviceMemoryProfiler.__exit__", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DeviceMemoryProfiler.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 2, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 4, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.utils.mem_utils.format_mib", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.utils.mem_utils.get_max_shared_memory_bytes", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.utils.mem_utils.memory_profiling", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.utils.mem_utils.MemoryProfilingResult", "methods": [ { "kind": "function", "name": "MemoryProfilingResult.__post_init__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MemoryProfilingResult.__repr__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MemoryProfilingResult.non_kv_cache_memory", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MemoryProfilingResult.torch_peak_increase", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MemoryProfilingResult.non_torch_increase", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MemoryProfilingResult.weights_memory", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MemoryProfilingResult.before_create", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MemoryProfilingResult.profile_time", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 0, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.utils.mem_utils", "names": [ "vllm.utils.mem_utils.DeviceMemoryProfiler", "vllm.utils.mem_utils.MemoryProfilingResult", "vllm.utils.mem_utils.MemorySnapshot", "vllm.utils.mem_utils.format_gib", "vllm.utils.mem_utils.format_mib", "vllm.utils.mem_utils.get_cpu_memory", "vllm.utils.mem_utils.get_max_shared_memory_bytes", "vllm.utils.mem_utils.memory_profiling" ], "n_typable": 26, "n_typed": 19, "n_any": 0, "n_untyped": 7, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 5, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 5, "n_classes": 3, "n_attrs": 16, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/utils/mistral.py", "symbol_reports": [ { "kind": "function", "name": "vllm.utils.mistral.is_mistral_tokenizer", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.utils.mistral.mt", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.utils.mistral", "names": [ "vllm.utils.mistral.is_mistral_tokenizer", "vllm.utils.mistral.mt" ], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/utils/nccl.py", "symbol_reports": [ { "kind": "function", "name": "vllm.utils.nccl.find_nccl_library", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.utils.nccl.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.utils.nccl.find_nccl_include_paths", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "type_ignores": [], "name": "vllm.utils.nccl", "names": [ "vllm.utils.nccl.find_nccl_include_paths", "vllm.utils.nccl.find_nccl_library", "vllm.utils.nccl.logger" ], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/utils/network_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.utils.network_utils.test_loopback_bind", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.utils.network_utils.make_zmq_socket", "n_typed": 6, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.utils.network_utils.zmq_socket_ctx", "n_typed": 5, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.utils.network_utils.close_sockets", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.utils.network_utils.is_valid_ipv6_address", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.utils.network_utils.make_zmq_path", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.utils.network_utils.get_distributed_init_method", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.utils.network_utils.join_host_port", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.utils.network_utils.split_host_port", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.utils.network_utils.get_open_zmq_ipc_path", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.utils.network_utils.split_zmq_path", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.utils.network_utils.get_ip", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.utils.network_utils.get_open_zmq_inproc_path", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.utils.network_utils.get_open_ports_list", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.utils.network_utils.get_open_port", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.utils.network_utils.get_loopback_ip", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.utils.network_utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.utils.network_utils.find_process_using_port", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.utils.network_utils.get_tcp_uri", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [ { "kind": "type", "rules": [ "name-defined" ] } ], "name": "vllm.utils.network_utils", "names": [ "vllm.utils.network_utils.close_sockets", "vllm.utils.network_utils.find_process_using_port", "vllm.utils.network_utils.get_distributed_init_method", "vllm.utils.network_utils.get_ip", "vllm.utils.network_utils.get_loopback_ip", "vllm.utils.network_utils.get_open_port", "vllm.utils.network_utils.get_open_ports_list", "vllm.utils.network_utils.get_open_zmq_inproc_path", "vllm.utils.network_utils.get_open_zmq_ipc_path", "vllm.utils.network_utils.get_tcp_uri", "vllm.utils.network_utils.is_valid_ipv6_address", "vllm.utils.network_utils.join_host_port", "vllm.utils.network_utils.logger", "vllm.utils.network_utils.make_zmq_path", "vllm.utils.network_utils.make_zmq_socket", "vllm.utils.network_utils.split_host_port", "vllm.utils.network_utils.split_zmq_path", "vllm.utils.network_utils.test_loopback_bind", "vllm.utils.network_utils.zmq_socket_ctx" ], "n_typable": 47, "n_typed": 43, "n_any": 2, "n_untyped": 2, "n_functions": 18, "n_function_overloads": 18, "n_function_params": 28, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 1 }, { "path": "vllm/utils/nvtx_pytorch_hooks.py", "symbol_reports": [ { "kind": "class", "name": "vllm.utils.nvtx_pytorch_hooks.ResultHolder", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ResultHolder.result", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.utils.nvtx_pytorch_hooks.process_layer_params", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.utils.nvtx_pytorch_hooks.layerwise_nvtx_marker_context", "n_typed": 0, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.utils.nvtx_pytorch_hooks.PytHooks", "methods": [ { "kind": "function", "name": "PytHooks.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PytHooks._process_layer_params", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PytHooks.module_fwd_hook", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "PytHooks.module_fwd_pre_hook", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "PytHooks.register_hooks", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PytHooks.module_to_name_map", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 0, "n_any": 0, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.utils.nvtx_pytorch_hooks.print_tensor", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.utils.nvtx_pytorch_hooks.construct_marker_dict_and_push", "n_typed": 0, "n_any": 0, "n_untyped": 6, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "type_ignores": [], "name": "vllm.utils.nvtx_pytorch_hooks", "names": [ "vllm.utils.nvtx_pytorch_hooks.PytHooks", "vllm.utils.nvtx_pytorch_hooks.ResultHolder", "vllm.utils.nvtx_pytorch_hooks.construct_marker_dict_and_push", "vllm.utils.nvtx_pytorch_hooks.layerwise_nvtx_marker_context", "vllm.utils.nvtx_pytorch_hooks.print_tensor", "vllm.utils.nvtx_pytorch_hooks.process_layer_params" ], "n_typable": 32, "n_typed": 0, "n_any": 0, "n_untyped": 32, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 13, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_classes": 2, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/utils/platform_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.utils.platform_utils.cuda_is_initialized", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.utils.platform_utils.num_compute_units", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.utils.platform_utils.is_uva_available", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.utils.platform_utils.xpu_is_initialized", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.utils.platform_utils.cuda_get_device_properties", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.utils.platform_utils.is_pin_memory_available", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "type_ignores": [], "name": "vllm.utils.platform_utils", "names": [ "vllm.utils.platform_utils.cuda_get_device_properties", "vllm.utils.platform_utils.cuda_is_initialized", "vllm.utils.platform_utils.is_pin_memory_available", "vllm.utils.platform_utils.is_uva_available", "vllm.utils.platform_utils.num_compute_units", "vllm.utils.platform_utils.xpu_is_initialized" ], "n_typable": 10, "n_typed": 8, "n_any": 0, "n_untyped": 2, "n_functions": 6, "n_function_overloads": 6, "n_function_params": 4, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/utils/print_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.utils.print_utils.print_embeddings", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.utils.print_utils", "names": [ "vllm.utils.print_utils.print_embeddings" ], "n_typable": 2, "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/utils/profiling.py", "symbol_reports": [ { "kind": "function", "name": "vllm.utils.profiling.cprofile_context", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.utils.profiling.cprofile", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.utils.profiling", "names": [ "vllm.utils.profiling.cprofile", "vllm.utils.profiling.cprofile_context" ], "n_typable": 5, "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 3, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/utils/registry.py", "symbol_reports": [ { "kind": "class", "name": "vllm.utils.registry.ExtensionManager", "methods": [ { "kind": "function", "name": "ExtensionManager.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ExtensionManager.register", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ExtensionManager.load", "n_typed": 1, "n_any": 1, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ExtensionManager.name2class", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 8, "n_typed": 4, "n_any": 1, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.utils.registry", "names": [ "vllm.utils.registry.ExtensionManager" ], "n_typable": 8, "n_typed": 4, "n_any": 1, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/utils/serial_utils.py", "symbol_reports": [ { "kind": "class", "name": "vllm.utils.serial_utils.DTypeInfo", "methods": [], "properties": [ { "kind": "property", "name": "DTypeInfo.nbytes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "DTypeInfo.torch_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DTypeInfo.torch_view_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DTypeInfo.numpy_view_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 1 }, { "kind": "attr", "name": "vllm.utils.serial_utils.ENDIANNESS", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.utils.serial_utils.EmbedDType", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.utils.serial_utils.Endianness", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.utils.serial_utils.EncodingFormat", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.utils.serial_utils.binary2tensor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "attr", "name": "vllm.utils.serial_utils.EMBED_DTYPES", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.utils.serial_utils.tensor2binary", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.utils.serial_utils.tensor2base64", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.utils.serial_utils", "names": [ "vllm.utils.serial_utils.DTypeInfo", "vllm.utils.serial_utils.EMBED_DTYPES", "vllm.utils.serial_utils.ENDIANNESS", "vllm.utils.serial_utils.EmbedDType", "vllm.utils.serial_utils.EncodingFormat", "vllm.utils.serial_utils.Endianness", "vllm.utils.serial_utils.binary2tensor", "vllm.utils.serial_utils.tensor2base64", "vllm.utils.serial_utils.tensor2binary" ], "n_typable": 17, "n_typed": 17, "n_any": 0, "n_untyped": 0, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 8, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 1, "n_attrs": 8, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/utils/system_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.utils.system_utils.update_environment_variables", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.utils.system_utils.suppress_stdout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.utils.system_utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.utils.system_utils.get_mp_context", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.utils.system_utils.unique_filepath", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.utils.system_utils.decorate_logs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.utils.system_utils.CYAN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.utils.system_utils.set_env_var", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.utils.system_utils.RESET", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.utils.system_utils.find_loaded_library", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.utils.system_utils.set_process_title", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.utils.system_utils.kill_process_tree", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.utils.system_utils.set_ulimit", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.utils.system_utils", "names": [ "vllm.utils.system_utils.CYAN", "vllm.utils.system_utils.RESET", "vllm.utils.system_utils.decorate_logs", "vllm.utils.system_utils.find_loaded_library", "vllm.utils.system_utils.get_mp_context", "vllm.utils.system_utils.kill_process_tree", "vllm.utils.system_utils.logger", "vllm.utils.system_utils.set_env_var", "vllm.utils.system_utils.set_process_title", "vllm.utils.system_utils.set_ulimit", "vllm.utils.system_utils.suppress_stdout", "vllm.utils.system_utils.unique_filepath", "vllm.utils.system_utils.update_environment_variables" ], "n_typable": 22, "n_typed": 16, "n_any": 0, "n_untyped": 6, "n_functions": 10, "n_function_overloads": 10, "n_function_params": 11, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/utils/tensor_schema.py", "symbol_reports": [ { "kind": "class", "name": "vllm.utils.tensor_schema.TensorSchema", "methods": [ { "kind": "function", "name": "TensorSchema.__init__", "n_typed": 3, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "TensorSchema.__getitem__", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TensorSchema.get", "n_typed": 1, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TensorSchema._match_shape_with_dynamic", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "TensorSchema._fmt_indexer", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TensorSchema._validate_field", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "TensorSchema._validate_tensor_shape_expected", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "TensorSchema.validate", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TensorSchema.print_shapes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 30, "n_typed": 26, "n_any": 4, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 21, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.utils.tensor_schema.TensorShape", "methods": [ { "kind": "function", "name": "TensorShape.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TensorShape.resolve", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TensorShape.__str__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TensorShape.dims", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TensorShape.dynamic_dims", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.utils.tensor_schema.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.utils.tensor_schema", "names": [ "vllm.utils.tensor_schema.TensorSchema", "vllm.utils.tensor_schema.TensorShape", "vllm.utils.tensor_schema.logger" ], "n_typable": 39, "n_typed": 32, "n_any": 4, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 24, "n_classes": 2, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/utils/torch_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.utils.torch_utils.is_torch_equal_or_newer", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.utils.torch_utils.kv_cache_dtype_str_to_dtype", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.utils.torch_utils.HAS_OPAQUE_TYPE", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.utils.torch_utils.get_kv_cache_quant_algo_string", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.utils.torch_utils.TORCH_DTYPE_TO_NUMPY_DTYPE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.utils.torch_utils.get_kv_cache_quant_algo_dtype", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.utils.torch_utils.direct_register_custom_op", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "vllm.utils.torch_utils.weak_ref_tensor", "n_typed": 0, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.utils.torch_utils.ModelConfig", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.utils.torch_utils.STR_DTYPE_TO_TORCH_DTYPE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.utils.torch_utils.create_kv_caches_with_random", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "attr", "name": "vllm.utils.torch_utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.utils.torch_utils.async_tensor_h2d", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.utils.torch_utils.get_dtype_size", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.utils.torch_utils.get_kv_cache_torch_dtype", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.utils.torch_utils.set_default_torch_num_threads", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.utils.torch_utils.cuda_device_count_stateless", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.utils.torch_utils.common_broadcastable_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.utils.torch_utils.IntermediateTensors", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.utils.torch_utils.MODELOPT_TO_VLLM_KV_CACHE_DTYPE_MAP", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.utils.torch_utils.vllm_lib", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.utils.torch_utils.supports_xccl", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.utils.torch_utils.aux_stream", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.utils.torch_utils.OpaqueBase", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.utils.torch_utils.T", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.utils.torch_utils.is_strictly_contiguous", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.utils.torch_utils.is_lossless_cast", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.utils.torch_utils.current_stream", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.utils.torch_utils.set_random_seed", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.utils.torch_utils.weak_ref_tensors", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.utils.torch_utils.is_torch_equal", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.utils.torch_utils.resolve_kv_cache_dtype_string", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.utils.torch_utils.set_default_torch_dtype", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.utils.torch_utils.ModuleName", "methods": [ { "kind": "function", "name": "ModuleName.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModuleName.__eq__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModuleName.__hash__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModuleName.__fx_repr__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ModuleName.value", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 1, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 2, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.utils.torch_utils.make_tensor_with_pad", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.utils.torch_utils.supports_xpu_graph", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.utils.torch_utils.get_accelerator_view_from_cpu_tensor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.utils.torch_utils.make_ndarray_with_pad", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.utils.torch_utils.guard_cuda_initialization", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.utils.torch_utils.create_kv_caches_with_random_flash", "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 } ], "type_ignores": [ { "kind": "type", "rules": [ "assignment", "misc" ] }, { "kind": "type", "rules": [ "misc" ] } ], "name": "vllm.utils.torch_utils", "names": [ "vllm.utils.torch_utils.HAS_OPAQUE_TYPE", "vllm.utils.torch_utils.IntermediateTensors", "vllm.utils.torch_utils.MODELOPT_TO_VLLM_KV_CACHE_DTYPE_MAP", "vllm.utils.torch_utils.ModelConfig", "vllm.utils.torch_utils.ModuleName", "vllm.utils.torch_utils.OpaqueBase", "vllm.utils.torch_utils.STR_DTYPE_TO_TORCH_DTYPE", "vllm.utils.torch_utils.T", "vllm.utils.torch_utils.TORCH_DTYPE_TO_NUMPY_DTYPE", "vllm.utils.torch_utils.async_tensor_h2d", "vllm.utils.torch_utils.aux_stream", "vllm.utils.torch_utils.common_broadcastable_dtype", "vllm.utils.torch_utils.create_kv_caches_with_random", "vllm.utils.torch_utils.create_kv_caches_with_random_flash", "vllm.utils.torch_utils.cuda_device_count_stateless", "vllm.utils.torch_utils.current_stream", "vllm.utils.torch_utils.direct_register_custom_op", "vllm.utils.torch_utils.get_accelerator_view_from_cpu_tensor", "vllm.utils.torch_utils.get_dtype_size", "vllm.utils.torch_utils.get_kv_cache_quant_algo_dtype", "vllm.utils.torch_utils.get_kv_cache_quant_algo_string", "vllm.utils.torch_utils.get_kv_cache_torch_dtype", "vllm.utils.torch_utils.guard_cuda_initialization", "vllm.utils.torch_utils.is_lossless_cast", "vllm.utils.torch_utils.is_strictly_contiguous", "vllm.utils.torch_utils.is_torch_equal", "vllm.utils.torch_utils.is_torch_equal_or_newer", "vllm.utils.torch_utils.kv_cache_dtype_str_to_dtype", "vllm.utils.torch_utils.logger", "vllm.utils.torch_utils.make_ndarray_with_pad", "vllm.utils.torch_utils.make_tensor_with_pad", "vllm.utils.torch_utils.resolve_kv_cache_dtype_string", "vllm.utils.torch_utils.set_default_torch_dtype", "vllm.utils.torch_utils.set_default_torch_num_threads", "vllm.utils.torch_utils.set_random_seed", "vllm.utils.torch_utils.supports_xccl", "vllm.utils.torch_utils.supports_xpu_graph", "vllm.utils.torch_utils.vllm_lib", "vllm.utils.torch_utils.weak_ref_tensor", "vllm.utils.torch_utils.weak_ref_tensors" ], "n_typable": 100, "n_typed": 83, "n_any": 2, "n_untyped": 15, "n_functions": 29, "n_function_overloads": 29, "n_function_params": 61, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 2, "n_classes": 1, "n_attrs": 11, "n_properties": 0, "n_type_ignores": 2 }, { "path": "vllm/utils/tqdm_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.utils.tqdm_utils.maybe_tqdm", "n_typed": 3, "n_any": 1, "n_untyped": 0, "n_overloads": 2, "n_typable": 4, "n_params": 3, "n_function_overloads": 2, "n_function_params": 3 } ], "type_ignores": [], "name": "vllm.utils.tqdm_utils", "names": [ "vllm.utils.tqdm_utils.maybe_tqdm" ], "n_typable": 4, "n_typed": 3, "n_any": 1, "n_untyped": 0, "n_functions": 1, "n_function_overloads": 2, "n_function_params": 3, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/backend.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.attention.backend.AttentionImpl", "methods": [ { "kind": "function", "name": "AttentionImpl.__init__", "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "AttentionImpl.forward", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "AttentionImpl.fused_output_quant_supported", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AttentionImpl.fused_rope_kvcache_supported", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AttentionImpl.do_rope_and_kv_cache_update", "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 } ], "properties": [], "attrs": [], "n_typable": 34, "n_typed": 31, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 29, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backend.CommonAttentionMetadata", "methods": [ { "kind": "function", "name": "CommonAttentionMetadata.batch_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CommonAttentionMetadata.naive_query_lens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CommonAttentionMetadata.replace", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CommonAttentionMetadata.compute_num_computed_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CommonAttentionMetadata.unpadded", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [ { "kind": "property", "name": "CommonAttentionMetadata.seq_lens_cpu", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "CommonAttentionMetadata.num_computed_tokens_cpu", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "CommonAttentionMetadata.query_start_loc", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CommonAttentionMetadata.query_start_loc_cpu", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CommonAttentionMetadata.seq_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CommonAttentionMetadata.num_reqs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CommonAttentionMetadata.num_actual_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CommonAttentionMetadata.max_query_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CommonAttentionMetadata.max_seq_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CommonAttentionMetadata.block_table_tensor", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CommonAttentionMetadata.slot_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CommonAttentionMetadata.causal", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CommonAttentionMetadata.logits_indices_padded", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CommonAttentionMetadata.num_logits_indices", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CommonAttentionMetadata.encoder_seq_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CommonAttentionMetadata.encoder_seq_lens_cpu", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CommonAttentionMetadata.dcp_local_seq_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CommonAttentionMetadata.dcp_local_seq_lens_cpu", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CommonAttentionMetadata._seq_lens_cpu", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CommonAttentionMetadata._num_computed_tokens_cpu", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CommonAttentionMetadata._num_computed_tokens_cache", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 10, "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 3, "n_attrs": 19, "n_properties": 2 }, { "kind": "class", "name": "vllm.v1.attention.backend.AttentionCGSupport", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "AttentionCGSupport.ALWAYS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionCGSupport.UNIFORM_BATCH", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionCGSupport.UNIFORM_SINGLE_TOKEN_DECODE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionCGSupport.NEVER", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backend.AttentionBackend", "methods": [ { "kind": "function", "name": "AttentionBackend.get_supported_kernel_block_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AttentionBackend.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AttentionBackend.get_impl_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AttentionBackend.get_builder_cls", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AttentionBackend.get_kv_cache_shape", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "AttentionBackend.get_kv_cache_block_dim", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "AttentionBackend.get_kv_cache_stride_order", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AttentionBackend.full_cls_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AttentionBackend.get_supported_head_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AttentionBackend.supports_head_size", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AttentionBackend.supports_dtype", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AttentionBackend.supports_kv_cache_dtype", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AttentionBackend.supports_block_size", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AttentionBackend.is_mla", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AttentionBackend.supports_sink", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AttentionBackend.supports_alibi_sqrt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AttentionBackend.supports_mm_prefix", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AttentionBackend.is_sparse", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AttentionBackend.supports_per_head_quant_scales", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AttentionBackend.supports_attn_type", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AttentionBackend.supports_compute_capability", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AttentionBackend.supports_combination", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "AttentionBackend.validate_configuration", "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "AttentionBackend.get_required_kv_cache_layout", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AttentionBackend.accept_output_buffer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AttentionBackend.supported_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AttentionBackend.supported_kv_cache_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AttentionBackend.forward_includes_kv_cache_update", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 63, "n_typed": 62, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 24, "n_method_overloads": 24, "n_method_params": 35, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backend.AttentionMetadataBuilder", "methods": [ { "kind": "function", "name": "AttentionMetadataBuilder.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "AttentionMetadataBuilder.get_cudagraph_support", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AttentionMetadataBuilder._init_reorder_batch_threshold", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "AttentionMetadataBuilder.build", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "AttentionMetadataBuilder.update_block_table", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "AttentionMetadataBuilder.build_for_cudagraph_capture", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AttentionMetadataBuilder.build_for_drafting", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AttentionMetadataBuilder.use_cascade_attention", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AttentionMetadataBuilder._cudagraph_support", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AttentionMetadataBuilder.reorder_batch_threshold", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AttentionMetadataBuilder.supports_update_block_table", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AttentionMetadataBuilder.kv_cache_spec", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AttentionMetadataBuilder.layer_names", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AttentionMetadataBuilder.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AttentionMetadataBuilder.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 42, "n_typed": 37, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 27, "n_attrs": 7, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.attention.backend.M", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.v1.attention.backend.SparseMLAAttentionImpl", "methods": [ { "kind": "function", "name": "SparseMLAAttentionImpl.__init__", "n_typed": 20, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 20, "n_params": 19, "n_function_overloads": 1, "n_function_params": 19 }, { "kind": "function", "name": "SparseMLAAttentionImpl.forward_mqa", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "SparseMLAAttentionImpl.do_kv_cache_update", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [], "n_typable": 32, "n_typed": 32, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 29, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.attention.backend.is_quantized_kv_cache", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.v1.attention.backend.T", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.v1.attention.backend.subclass_attention_backend", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.v1.attention.backend.AttentionType", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "AttentionType.DECODER", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionType.ENCODER", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionType.ENCODER_ONLY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionType.ENCODER_DECODER", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backend.AttentionLayer", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backend.AttentionMetadata", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backend.AttentionImplBase", "methods": [ { "kind": "function", "name": "AttentionImplBase.__new__", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AttentionImplBase.process_weights_after_loading", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AttentionImplBase.num_heads", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AttentionImplBase.head_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AttentionImplBase.scale", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AttentionImplBase.can_return_lse_for_decode", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AttentionImplBase.supports_pcp", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AttentionImplBase.supports_mtp_with_cp_non_trivial_interleave_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AttentionImplBase.need_to_return_lse_for_decode", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AttentionImplBase.supports_quant_query_input", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AttentionImplBase.dcp_world_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AttentionImplBase.dcp_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AttentionImplBase.pcp_world_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AttentionImplBase.pcp_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AttentionImplBase.total_cp_world_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AttentionImplBase.total_cp_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 19, "n_typed": 15, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 14, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.attention.backend.subclass_attention_backend_with_overrides", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.v1.attention.backend.MultipleOf", "methods": [ { "kind": "function", "name": "MultipleOf.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MultipleOf.base", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backend.MLAAttentionImpl", "methods": [ { "kind": "function", "name": "MLAAttentionImpl.__init__", "n_typed": 20, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 20, "n_params": 19, "n_function_overloads": 1, "n_function_params": 19 }, { "kind": "function", "name": "MLAAttentionImpl.forward_mha", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "MLAAttentionImpl.forward_mqa", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MLAAttentionImpl.do_kv_cache_update", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [], "n_typable": 40, "n_typed": 40, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 36, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.attention.backend", "names": [ "vllm.v1.attention.backend.AttentionBackend", "vllm.v1.attention.backend.AttentionCGSupport", "vllm.v1.attention.backend.AttentionImpl", "vllm.v1.attention.backend.AttentionImplBase", "vllm.v1.attention.backend.AttentionLayer", "vllm.v1.attention.backend.AttentionMetadata", "vllm.v1.attention.backend.AttentionMetadataBuilder", "vllm.v1.attention.backend.AttentionType", "vllm.v1.attention.backend.CommonAttentionMetadata", "vllm.v1.attention.backend.M", "vllm.v1.attention.backend.MLAAttentionImpl", "vllm.v1.attention.backend.MultipleOf", "vllm.v1.attention.backend.SparseMLAAttentionImpl", "vllm.v1.attention.backend.T", "vllm.v1.attention.backend.is_quantized_kv_cache", "vllm.v1.attention.backend.subclass_attention_backend", "vllm.v1.attention.backend.subclass_attention_backend_with_overrides" ], "n_typable": 253, "n_typed": 238, "n_any": 0, "n_untyped": 15, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 7, "n_methods": 52, "n_method_overloads": 52, "n_method_params": 163, "n_classes": 12, "n_attrs": 55, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/backends/cpu_attn.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.attention.backends.cpu_attn.CPUAttentionMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "CPUAttentionMetadata.isa", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CPUAttentionMetadata.num_actual_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CPUAttentionMetadata.max_query_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CPUAttentionMetadata.query_start_loc", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CPUAttentionMetadata.max_seq_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CPUAttentionMetadata.seq_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CPUAttentionMetadata.block_table", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CPUAttentionMetadata.slot_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CPUAttentionMetadata.scheduler_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CPUAttentionMetadata.causal", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CPUAttentionMetadata.use_sdpa_prefill", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CPUAttentionMetadata.num_decode_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CPUAttentionMetadata.sdpa_attn_masks", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CPUAttentionMetadata.sdpa_start_loc", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 14, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.cpu_attn.CPUAttentionBackend", "methods": [ { "kind": "function", "name": "CPUAttentionBackend.get_supported_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CPUAttentionBackend.get_supported_head_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CPUAttentionBackend.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CPUAttentionBackend.supports_attn_type", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CPUAttentionBackend.get_impl_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CPUAttentionBackend.get_builder_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CPUAttentionBackend.get_kv_cache_shape", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "CPUAttentionBackend.use_cascade_attention", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CPUAttentionBackend.accept_output_buffer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CPUAttentionBackend.supported_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 18, "n_typed": 16, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 8, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.cpu_attn.CPUAttentionMetadataBuilder", "methods": [ { "kind": "function", "name": "CPUAttentionMetadataBuilder.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "CPUAttentionMetadataBuilder.build", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CPUAttentionMetadataBuilder.use_sdpa_prefill", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CPUAttentionMetadataBuilder.kv_cache_spec", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CPUAttentionMetadataBuilder.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CPUAttentionMetadataBuilder.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CPUAttentionMetadataBuilder.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CPUAttentionMetadataBuilder.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CPUAttentionMetadataBuilder.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CPUAttentionMetadataBuilder.window_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CPUAttentionMetadataBuilder.block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CPUAttentionMetadataBuilder.isa", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CPUAttentionMetadataBuilder.is_cross_attention", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 9, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 11, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.attention.backends.cpu_attn.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.attention.backends.cpu_attn.CPUAttentionBackendImpl", "methods": [ { "kind": "function", "name": "CPUAttentionBackendImpl.__init__", "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "CPUAttentionBackendImpl.forward", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "CPUAttentionBackendImpl._run_sdpa_forward", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CPUAttentionBackendImpl.kv_sharing_target_layer_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CPUAttentionBackendImpl.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CPUAttentionBackendImpl.head_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CPUAttentionBackendImpl.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CPUAttentionBackendImpl.logits_soft_cap", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CPUAttentionBackendImpl.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CPUAttentionBackendImpl.alibi_slopes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CPUAttentionBackendImpl.kv_cache_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CPUAttentionBackendImpl.num_queries_per_kv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CPUAttentionBackendImpl.attn_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CPUAttentionBackendImpl.sinks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CPUAttentionBackendImpl.sliding_window", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 41, "n_typed": 29, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 26, "n_attrs": 12, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.attention.backends.cpu_attn", "names": [ "vllm.v1.attention.backends.cpu_attn.CPUAttentionBackend", "vllm.v1.attention.backends.cpu_attn.CPUAttentionBackendImpl", "vllm.v1.attention.backends.cpu_attn.CPUAttentionMetadata", "vllm.v1.attention.backends.cpu_attn.CPUAttentionMetadataBuilder", "vllm.v1.attention.backends.cpu_attn.logger" ], "n_typable": 80, "n_typed": 54, "n_any": 0, "n_untyped": 26, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 41, "n_classes": 4, "n_attrs": 40, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/backends/fa_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.attention.backends.fa_utils.flash_attn_varlen_func", "n_typed": 0, "n_any": 3, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.v1.attention.backends.fa_utils.get_flash_attn_version", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.v1.attention.backends.fa_utils.get_scheduler_metadata", "n_typed": 1, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.v1.attention.backends.fa_utils.flash_attn_supports_sinks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.v1.attention.backends.fa_utils.flash_attn_supports_fp8", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.v1.attention.backends.fa_utils.flash_attn_supports_mla", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.v1.attention.backends.fa_utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.v1.attention.backends.fa_utils.is_flash_attn_varlen_func_available", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "type_ignores": [ { "kind": "type", "rules": [ "assignment" ] }, { "kind": "type", "rules": [ "assignment" ] }, { "kind": "type", "rules": [ "no-redef" ] }, { "kind": "type", "rules": [ "misc", "no-redef" ] }, { "kind": "type", "rules": [ "misc" ] } ], "name": "vllm.v1.attention.backends.fa_utils", "names": [ "vllm.v1.attention.backends.fa_utils.flash_attn_supports_fp8", "vllm.v1.attention.backends.fa_utils.flash_attn_supports_mla", "vllm.v1.attention.backends.fa_utils.flash_attn_supports_sinks", "vllm.v1.attention.backends.fa_utils.flash_attn_varlen_func", "vllm.v1.attention.backends.fa_utils.get_flash_attn_version", "vllm.v1.attention.backends.fa_utils.get_scheduler_metadata", "vllm.v1.attention.backends.fa_utils.is_flash_attn_varlen_func_available", "vllm.v1.attention.backends.fa_utils.logger" ], "n_typable": 14, "n_typed": 7, "n_any": 5, "n_untyped": 2, "n_functions": 7, "n_function_overloads": 7, "n_function_params": 6, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 5 }, { "path": "vllm/v1/attention/backends/flash_attn.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.v1.attention.backends.flash_attn.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.v1.attention.backends.flash_attn.cascade_attention", "n_typed": 25, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 25, "n_params": 24, "n_function_overloads": 1, "n_function_params": 24 }, { "kind": "class", "name": "vllm.v1.attention.backends.flash_attn.FlashAttentionBackend", "methods": [ { "kind": "function", "name": "FlashAttentionBackend.get_supported_kernel_block_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashAttentionBackend.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashAttentionBackend.supports_attn_type", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlashAttentionBackend.supports_per_head_quant_scales", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashAttentionBackend.get_impl_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashAttentionBackend.get_builder_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashAttentionBackend.get_kv_cache_shape", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "FlashAttentionBackend.get_kv_cache_stride_order", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlashAttentionBackend.get_fp8_dtype_for_flashattn", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlashAttentionBackend.supports_head_size", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlashAttentionBackend.supports_kv_cache_dtype", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlashAttentionBackend.supports_sink", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashAttentionBackend.supports_compute_capability", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlashAttentionBackend.supports_combination", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashAttentionBackend.accept_output_buffer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackend.supported_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackend.forward_includes_kv_cache_update", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 36, "n_typed": 36, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 19, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.flash_attn.FlashAttentionImpl", "methods": [ { "kind": "function", "name": "FlashAttentionImpl.__init__", "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "FlashAttentionImpl.forward", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "FlashAttentionImpl.do_kv_cache_update", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "FlashAttentionImpl._forward_with_dcp", "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "FlashAttentionImpl._forward_encoder_attention", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashAttentionImpl.can_return_lse_for_decode", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionImpl.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionImpl.head_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionImpl.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionImpl.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionImpl.alibi_slopes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionImpl.kv_cache_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionImpl.logits_soft_cap", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionImpl.kv_sharing_target_layer_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionImpl.num_queries_per_kv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionImpl.attn_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionImpl.vllm_flash_attn_version", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionImpl.batch_invariant_enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionImpl.sinks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionImpl.supports_quant_query_input", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionImpl.sliding_window", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 62, "n_typed": 47, "n_any": 0, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 41, "n_attrs": 16, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.flash_attn.FlashAttentionMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashAttentionMetadata.num_actual_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashAttentionMetadata.max_query_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashAttentionMetadata.query_start_loc", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashAttentionMetadata.max_seq_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashAttentionMetadata.seq_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashAttentionMetadata.block_table", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashAttentionMetadata.slot_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashAttentionMetadata.use_cascade", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashAttentionMetadata.common_prefix_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashAttentionMetadata.cu_prefix_query_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashAttentionMetadata.prefix_kv_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashAttentionMetadata.suffix_kv_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashAttentionMetadata.max_dcp_context_kv_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashAttentionMetadata.dcp_context_kv_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashAttentionMetadata.scheduler_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashAttentionMetadata.prefix_scheduler_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashAttentionMetadata.max_num_splits", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashAttentionMetadata.causal", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 18, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.flash_attn.FlashAttentionMetadataBuilder", "methods": [ { "kind": "function", "name": "FlashAttentionMetadataBuilder.get_cudagraph_support", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FlashAttentionMetadataBuilder.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FlashAttentionMetadataBuilder.build", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "FlashAttentionMetadataBuilder.update_block_table", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "FlashAttentionMetadataBuilder.use_cascade_attention", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashAttentionMetadataBuilder._cudagraph_support", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionMetadataBuilder.supports_update_block_table", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionMetadataBuilder.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionMetadataBuilder.parallel_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionMetadataBuilder.cache_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionMetadataBuilder.compilation_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionMetadataBuilder.attention_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionMetadataBuilder.num_heads_q", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionMetadataBuilder.num_heads_kv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionMetadataBuilder.kv_cache_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionMetadataBuilder.headdim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionMetadataBuilder.block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionMetadataBuilder.max_num_splits", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionMetadataBuilder.aot_schedule", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionMetadataBuilder.cp_kv_cache_interleave_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionMetadataBuilder.use_full_cuda_graph", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionMetadataBuilder.max_cudagraph_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionMetadataBuilder.aot_sliding_window", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionMetadataBuilder.dcp_world_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionMetadataBuilder.dcp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionMetadataBuilder.scheduler_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 40, "n_typed": 18, "n_any": 0, "n_untyped": 22, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 14, "n_attrs": 21, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.attention.backends.flash_attn.use_cascade_attention", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 } ], "type_ignores": [], "name": "vllm.v1.attention.backends.flash_attn", "names": [ "vllm.v1.attention.backends.flash_attn.FlashAttentionBackend", "vllm.v1.attention.backends.flash_attn.FlashAttentionImpl", "vllm.v1.attention.backends.flash_attn.FlashAttentionMetadata", "vllm.v1.attention.backends.flash_attn.FlashAttentionMetadataBuilder", "vllm.v1.attention.backends.flash_attn.cascade_attention", "vllm.v1.attention.backends.flash_attn.logger", "vllm.v1.attention.backends.flash_attn.use_cascade_attention" ], "n_typable": 174, "n_typed": 136, "n_any": 0, "n_untyped": 38, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 33, "n_methods": 24, "n_method_overloads": 24, "n_method_params": 74, "n_classes": 4, "n_attrs": 59, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/backends/flash_attn_diffkv.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.attention.backends.flash_attn_diffkv.FlashAttentionDiffKVImpl", "methods": [ { "kind": "function", "name": "FlashAttentionDiffKVImpl.forward", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 } ], "properties": [], "attrs": [], "n_typable": 10, "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 9, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.attention.backends.flash_attn_diffkv.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.attention.backends.flash_attn_diffkv.FlashAttentionDiffKVBackend", "methods": [ { "kind": "function", "name": "FlashAttentionDiffKVBackend.set_head_size_v", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlashAttentionDiffKVBackend.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashAttentionDiffKVBackend.get_impl_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashAttentionDiffKVBackend.get_kv_cache_shape", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "FlashAttentionDiffKVBackend.get_kv_cache_stride_order", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashAttentionDiffKVBackend.head_size_v", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 13, "n_typed": 13, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 7, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.attention.backends.flash_attn_diffkv", "names": [ "vllm.v1.attention.backends.flash_attn_diffkv.FlashAttentionDiffKVBackend", "vllm.v1.attention.backends.flash_attn_diffkv.FlashAttentionDiffKVImpl", "vllm.v1.attention.backends.flash_attn_diffkv.logger" ], "n_typable": 24, "n_typed": 23, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 16, "n_classes": 2, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/backends/flashinfer.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.attention.backends.flashinfer.FlashInferBackend", "methods": [ { "kind": "function", "name": "FlashInferBackend.get_supported_kernel_block_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashInferBackend.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashInferBackend.get_impl_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashInferBackend.get_builder_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashInferBackend.get_kv_cache_shape", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "FlashInferBackend.get_kv_cache_stride_order", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlashInferBackend.get_fp8_dtype_for_flashinfer", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlashInferBackend.get_supported_head_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashInferBackend.supports_compute_capability", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlashInferBackend.supports_sink", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashInferBackend.get_required_kv_cache_layout", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashInferBackend.accept_output_buffer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferBackend.supported_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferBackend.supported_kv_cache_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferBackend.forward_includes_kv_cache_update", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 23, "n_typed": 23, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 8, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.flashinfer.BatchDCPPrefillWrapper", "methods": [ { "kind": "function", "name": "BatchDCPPrefillWrapper.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BatchDCPPrefillWrapper.plan", "n_typed": 16, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 17, "n_params": 16, "n_function_overloads": 1, "n_function_params": 16 }, { "kind": "function", "name": "BatchDCPPrefillWrapper.run", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [], "n_typable": 26, "n_typed": 23, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 23, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.flashinfer.FIDecode", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "FIDecode.wrapper", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.flashinfer.TRTLLMDecode", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "TRTLLMDecode.block_tables", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TRTLLMDecode.seq_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TRTLLMDecode.max_seq_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.flashinfer.FIPrefill", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "FIPrefill.wrapper", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.attention.backends.flashinfer.trtllm_gen_workspace_buffer", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.v1.attention.backends.flashinfer.fast_plan_decode", "n_typed": 21, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 22, "n_params": 21, "n_function_overloads": 1, "n_function_params": 21 }, { "kind": "attr", "name": "vllm.v1.attention.backends.flashinfer.FP8_DTYPE", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.attention.backends.flashinfer.TRTLLMPrefill", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "TRTLLMPrefill.block_tables", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TRTLLMPrefill.seq_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TRTLLMPrefill.cum_seq_lens_q", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TRTLLMPrefill.cum_seq_lens_kv", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TRTLLMPrefill.max_q_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TRTLLMPrefill.max_seq_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.flashinfer.FlashInferMetadataBuilder", "methods": [ { "kind": "function", "name": "FlashInferMetadataBuilder.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FlashInferMetadataBuilder._make_buffer", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FlashInferMetadataBuilder.get_cudagraph_support", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FlashInferMetadataBuilder._get_workspace_buffer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashInferMetadataBuilder.set_workspace_buffer", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlashInferMetadataBuilder._get_prefill_wrapper", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashInferMetadataBuilder._get_decode_wrapper", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FlashInferMetadataBuilder._get_cascade_wrapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashInferMetadataBuilder._compute_flashinfer_kv_metadata", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "FlashInferMetadataBuilder.build", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "FlashInferMetadataBuilder.use_cascade_attention", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashInferMetadataBuilder.reorder_batch_threshold", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMetadataBuilder.cache_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMetadataBuilder.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMetadataBuilder.attention_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMetadataBuilder.compilation_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMetadataBuilder.enable_cuda_graph", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMetadataBuilder.use_dcp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMetadataBuilder.num_qo_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMetadataBuilder.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMetadataBuilder.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMetadataBuilder.page_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMetadataBuilder.cache_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMetadataBuilder.use_trtllm_decode_attention", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMetadataBuilder.global_hyperparameters", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMetadataBuilder.sm_scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMetadataBuilder.window_left", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMetadataBuilder.logits_soft_cap", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMetadataBuilder.has_sinks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMetadataBuilder.pin_memory", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMetadataBuilder.paged_kv_indptr", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMetadataBuilder.paged_kv_indptr_cpu_buffer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMetadataBuilder.paged_kv_indices", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMetadataBuilder.paged_kv_last_page_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMetadataBuilder.decode_fixed_split_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMetadataBuilder.prefill_fixed_split_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMetadataBuilder.disable_split_kv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMetadataBuilder.dcp_world_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMetadataBuilder.dcp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMetadataBuilder.dcp_kv_cache_interleave_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMetadataBuilder.kv_cache_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMetadataBuilder.q_data_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 63, "n_typed": 26, "n_any": 0, "n_untyped": 37, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 21, "n_attrs": 31, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.flashinfer.FlashInferMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashInferMetadata.num_actual_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashInferMetadata.slot_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashInferMetadata.q_data_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashInferMetadata.num_decodes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashInferMetadata.num_decode_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashInferMetadata.num_prefills", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashInferMetadata.num_prefill_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashInferMetadata.prefill", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashInferMetadata.decode", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashInferMetadata.use_cascade", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashInferMetadata.cascade_wrapper", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 11, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.attention.backends.flashinfer.trtllm_prefill_attn_kvfp8_dequant", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "attr", "name": "vllm.v1.attention.backends.flashinfer.FLASHINFER_WORKSPACE_BUFFER_SIZE_BATCH_INVARIANT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.v1.attention.backends.flashinfer.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.attention.backends.flashinfer.FlashInferImpl", "methods": [ { "kind": "function", "name": "FlashInferImpl.__init__", "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "FlashInferImpl.fused_output_quant_supported", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlashInferImpl.process_weights_after_loading", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlashInferImpl.forward", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "FlashInferImpl.do_kv_cache_update", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashInferImpl.can_return_lse_for_decode", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferImpl.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferImpl.head_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferImpl.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferImpl.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferImpl.alibi_slopes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferImpl.window_left", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferImpl.kv_cache_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferImpl.logits_soft_cap", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferImpl.kv_sharing_target_layer_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferImpl.num_queries_per_kv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferImpl.sinks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferImpl.support_trtllm_attn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferImpl.supports_quant_query_input", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferImpl.bmm1_scale", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferImpl.bmm2_scale", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferImpl.o_sf_scale", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferImpl.sliding_window", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 50, "n_typed": 35, "n_any": 0, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 27, "n_attrs": 18, "n_properties": 0 } ], "type_ignores": [ { "kind": "type", "rules": [ "misc" ] } ], "name": "vllm.v1.attention.backends.flashinfer", "names": [ "vllm.v1.attention.backends.flashinfer.BatchDCPPrefillWrapper", "vllm.v1.attention.backends.flashinfer.FIDecode", "vllm.v1.attention.backends.flashinfer.FIPrefill", "vllm.v1.attention.backends.flashinfer.FLASHINFER_WORKSPACE_BUFFER_SIZE_BATCH_INVARIANT", "vllm.v1.attention.backends.flashinfer.FP8_DTYPE", "vllm.v1.attention.backends.flashinfer.FlashInferBackend", "vllm.v1.attention.backends.flashinfer.FlashInferImpl", "vllm.v1.attention.backends.flashinfer.FlashInferMetadata", "vllm.v1.attention.backends.flashinfer.FlashInferMetadataBuilder", "vllm.v1.attention.backends.flashinfer.TRTLLMDecode", "vllm.v1.attention.backends.flashinfer.TRTLLMPrefill", "vllm.v1.attention.backends.flashinfer.fast_plan_decode", "vllm.v1.attention.backends.flashinfer.logger", "vllm.v1.attention.backends.flashinfer.trtllm_gen_workspace_buffer", "vllm.v1.attention.backends.flashinfer.trtllm_prefill_attn_kvfp8_dequant" ], "n_typable": 192, "n_typed": 134, "n_any": 0, "n_untyped": 58, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 26, "n_methods": 30, "n_method_overloads": 30, "n_method_params": 79, "n_classes": 9, "n_attrs": 79, "n_properties": 0, "n_type_ignores": 1 }, { "path": "vllm/v1/attention/backends/flex_attention.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.attention.backends.flex_attention.FlexAttentionBackend", "methods": [ { "kind": "function", "name": "FlexAttentionBackend.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlexAttentionBackend.supports_attn_type", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlexAttentionBackend.supports_mm_prefix", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlexAttentionBackend.get_impl_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlexAttentionBackend.get_kv_cache_shape", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "FlexAttentionBackend.get_builder_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlexAttentionBackend.use_cascade_attention", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FlexAttentionBackend.get_supported_head_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlexAttentionBackend.accept_output_buffer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlexAttentionBackend.supported_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlexAttentionBackend.supported_kv_cache_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 19, "n_typed": 17, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 8, "n_attrs": 3, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.attention.backends.flex_attention.physical_to_logical_mapping", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "attr", "name": "vllm.v1.attention.backends.flex_attention.flex_attention_compiled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.attention.backends.flex_attention.FlexAttentionMetadataBuilder", "methods": [ { "kind": "function", "name": "FlexAttentionMetadataBuilder.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FlexAttentionMetadataBuilder.build", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "FlexAttentionMetadataBuilder.use_cascade_attention", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlexAttentionMetadataBuilder.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlexAttentionMetadataBuilder.parallel_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlexAttentionMetadataBuilder.cache_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlexAttentionMetadataBuilder.num_heads_q", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlexAttentionMetadataBuilder.num_heads_kv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlexAttentionMetadataBuilder.headdim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlexAttentionMetadataBuilder.block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlexAttentionMetadataBuilder.kv_cache_spec", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlexAttentionMetadataBuilder.direct_build", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlexAttentionMetadataBuilder.q_block_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlexAttentionMetadataBuilder.kv_block_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 23, "n_typed": 12, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 11, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.attention.backends.flex_attention.causal_mask_mod", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.v1.attention.backends.flex_attention.get_kernel_options", "n_typed": 2, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.v1.attention.backends.flex_attention.pad_to_multiple", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.v1.attention.backends.flex_attention.FlexAttentionMetadata", "methods": [ { "kind": "function", "name": "FlexAttentionMetadata._convert_physical_to_logical", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "FlexAttentionMetadata.get_causal_mask_mod", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlexAttentionMetadata.get_bidirectional_mask_mod", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlexAttentionMetadata.get_sliding_window_mask_mod", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlexAttentionMetadata.get_prefix_lm_mask_mod", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlexAttentionMetadata.get_mask_mod", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlexAttentionMetadata.get_transformed_score_mod", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlexAttentionMetadata._build_block_mask_direct", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlexAttentionMetadata.build_block_mask", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlexAttentionMetadata.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "FlexAttentionMetadata.logical_block_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "FlexAttentionMetadata.causal", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlexAttentionMetadata.num_actual_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlexAttentionMetadata.max_query_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlexAttentionMetadata.query_start_loc", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlexAttentionMetadata.max_seq_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlexAttentionMetadata.seq_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlexAttentionMetadata.block_table", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlexAttentionMetadata.slot_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlexAttentionMetadata.use_cascade", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlexAttentionMetadata.common_prefix_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlexAttentionMetadata.cu_prefix_query_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlexAttentionMetadata.prefix_kv_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlexAttentionMetadata.suffix_kv_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlexAttentionMetadata.total_cache_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlexAttentionMetadata.block_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlexAttentionMetadata.max_possible_sequence_length", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlexAttentionMetadata.num_reqs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlexAttentionMetadata.physical_to_logical", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlexAttentionMetadata.decode_offset", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlexAttentionMetadata.num_blocks_per_seq", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlexAttentionMetadata.num_input_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlexAttentionMetadata.num_blocks", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlexAttentionMetadata.block_mask", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlexAttentionMetadata.score_mod", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlexAttentionMetadata.logical_mask_mod", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlexAttentionMetadata.doc_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlexAttentionMetadata.direct_build", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlexAttentionMetadata.q_block_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlexAttentionMetadata.kv_block_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlexAttentionMetadata.transformed_score_mod", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlexAttentionMetadata.sliding_window", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlexAttentionMetadata.mm_prefix_range", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 14, "n_typed": 11, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 3, "n_attrs": 32, "n_properties": 1 }, { "kind": "attr", "name": "vllm.v1.attention.backends.flex_attention.create_block_mask_compiled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.attention.backends.flex_attention.FlexAttentionImpl", "methods": [ { "kind": "function", "name": "FlexAttentionImpl.__init__", "n_typed": 11, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "FlexAttentionImpl.view_as_4d", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlexAttentionImpl.forward", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlexAttentionImpl.sliding_window", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlexAttentionImpl.alibi_slopes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlexAttentionImpl.logits_soft_cap", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlexAttentionImpl.mm_prefix_range", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlexAttentionImpl.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlexAttentionImpl.head_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlexAttentionImpl.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlexAttentionImpl.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlexAttentionImpl.attn_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlexAttentionImpl.kv_cache_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlexAttentionImpl.num_queries_per_kv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 35, "n_typed": 27, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 21, "n_attrs": 11, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.attention.backends.flex_attention.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.v1.attention.backends.flex_attention.unique_static_unsorted", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "type_ignores": [], "name": "vllm.v1.attention.backends.flex_attention", "names": [ "vllm.v1.attention.backends.flex_attention.FlexAttentionBackend", "vllm.v1.attention.backends.flex_attention.FlexAttentionImpl", "vllm.v1.attention.backends.flex_attention.FlexAttentionMetadata", "vllm.v1.attention.backends.flex_attention.FlexAttentionMetadataBuilder", "vllm.v1.attention.backends.flex_attention.causal_mask_mod", "vllm.v1.attention.backends.flex_attention.create_block_mask_compiled", "vllm.v1.attention.backends.flex_attention.flex_attention_compiled", "vllm.v1.attention.backends.flex_attention.get_kernel_options", "vllm.v1.attention.backends.flex_attention.logger", "vllm.v1.attention.backends.flex_attention.pad_to_multiple", "vllm.v1.attention.backends.flex_attention.physical_to_logical_mapping", "vllm.v1.attention.backends.flex_attention.unique_static_unsorted" ], "n_typable": 119, "n_typed": 87, "n_any": 0, "n_untyped": 32, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 20, "n_methods": 24, "n_method_overloads": 24, "n_method_params": 41, "n_classes": 4, "n_attrs": 60, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/backends/gdn_attn.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.attention.backends.gdn_attn.GDNAttentionMetadataBuilder", "methods": [ { "kind": "function", "name": "GDNAttentionMetadataBuilder.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GDNAttentionMetadataBuilder.build", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "GDNAttentionMetadataBuilder.build_for_cudagraph_capture", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GDNAttentionMetadataBuilder._cudagraph_support", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GDNAttentionMetadataBuilder.reorder_batch_threshold", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GDNAttentionMetadataBuilder.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GDNAttentionMetadataBuilder.compilation_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GDNAttentionMetadataBuilder.speculative_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GDNAttentionMetadataBuilder.kv_cache_spec", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GDNAttentionMetadataBuilder.use_spec_decode", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GDNAttentionMetadataBuilder.use_full_cuda_graph", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GDNAttentionMetadataBuilder.decode_cudagraph_max_bs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GDNAttentionMetadataBuilder.spec_state_indices_tensor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GDNAttentionMetadataBuilder.non_spec_state_indices_tensor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GDNAttentionMetadataBuilder.spec_sequence_masks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GDNAttentionMetadataBuilder.spec_token_indx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GDNAttentionMetadataBuilder.non_spec_token_indx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GDNAttentionMetadataBuilder.spec_query_start_loc", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GDNAttentionMetadataBuilder.non_spec_query_start_loc", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GDNAttentionMetadataBuilder.num_accepted_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GDNAttentionMetadataBuilder.num_spec", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 30, "n_typed": 13, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 10, "n_attrs": 18, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.gdn_attn.GDNAttentionBackend", "methods": [ { "kind": "function", "name": "GDNAttentionBackend.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GDNAttentionBackend.get_builder_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.gdn_attn.GDNAttentionMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "GDNAttentionMetadata.num_prefills", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GDNAttentionMetadata.num_prefill_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GDNAttentionMetadata.num_decodes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GDNAttentionMetadata.num_decode_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GDNAttentionMetadata.num_spec_decodes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GDNAttentionMetadata.num_spec_decode_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GDNAttentionMetadata.num_actual_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GDNAttentionMetadata.has_initial_state", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GDNAttentionMetadata.spec_query_start_loc", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GDNAttentionMetadata.non_spec_query_start_loc", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GDNAttentionMetadata.spec_state_indices_tensor", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GDNAttentionMetadata.non_spec_state_indices_tensor", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GDNAttentionMetadata.spec_sequence_masks", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GDNAttentionMetadata.spec_token_indx", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GDNAttentionMetadata.non_spec_token_indx", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GDNAttentionMetadata.num_accepted_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GDNAttentionMetadata.nums_dict", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GDNAttentionMetadata.batch_ptr", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GDNAttentionMetadata.token_chunk_offset_ptr", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 19, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.attention.backends.gdn_attn", "names": [ "vllm.v1.attention.backends.gdn_attn.GDNAttentionBackend", "vllm.v1.attention.backends.gdn_attn.GDNAttentionMetadata", "vllm.v1.attention.backends.gdn_attn.GDNAttentionMetadataBuilder" ], "n_typable": 32, "n_typed": 15, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 10, "n_classes": 3, "n_attrs": 37, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/backends/linear_attn.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.attention.backends.linear_attn.LinearAttentionMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "LinearAttentionMetadata.num_prefills", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LinearAttentionMetadata.num_prefill_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LinearAttentionMetadata.num_decodes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LinearAttentionMetadata.num_decode_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LinearAttentionMetadata.query_start_loc", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LinearAttentionMetadata.seq_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LinearAttentionMetadata.state_indices_tensor", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.linear_attn.LinearAttentionMetadataBuilder", "methods": [ { "kind": "function", "name": "LinearAttentionMetadataBuilder.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "LinearAttentionMetadataBuilder.build", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LinearAttentionMetadataBuilder.reorder_batch_threshold", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LinearAttentionMetadataBuilder._cudagraph_support", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 10, "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.linear_attn.LinearAttentionBackend", "methods": [ { "kind": "function", "name": "LinearAttentionBackend.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LinearAttentionBackend.get_builder_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.attention.backends.linear_attn", "names": [ "vllm.v1.attention.backends.linear_attn.LinearAttentionBackend", "vllm.v1.attention.backends.linear_attn.LinearAttentionMetadata", "vllm.v1.attention.backends.linear_attn.LinearAttentionMetadataBuilder" ], "n_typable": 12, "n_typed": 11, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 7, "n_classes": 3, "n_attrs": 9, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/backends/mamba1_attn.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.attention.backends.mamba1_attn.Mamba1AttentionBackend", "methods": [ { "kind": "function", "name": "Mamba1AttentionBackend.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Mamba1AttentionBackend.get_builder_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.mamba1_attn.Mamba1AttentionMetadata", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.mamba1_attn.Mamba1AttentionMetadataBuilder", "methods": [ { "kind": "function", "name": "Mamba1AttentionMetadataBuilder.build", "n_typed": 4, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Mamba1AttentionMetadataBuilder.metadata_cls", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 5, "n_typed": 4, "n_any": 1, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 4, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.attention.backends.mamba1_attn", "names": [ "vllm.v1.attention.backends.mamba1_attn.Mamba1AttentionBackend", "vllm.v1.attention.backends.mamba1_attn.Mamba1AttentionMetadata", "vllm.v1.attention.backends.mamba1_attn.Mamba1AttentionMetadataBuilder" ], "n_typable": 7, "n_typed": 6, "n_any": 1, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_classes": 3, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/backends/mamba2_attn.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.attention.backends.mamba2_attn.Mamba2AttentionBackend", "methods": [ { "kind": "function", "name": "Mamba2AttentionBackend.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Mamba2AttentionBackend.get_builder_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.mamba2_attn.Mamba2AttentionMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Mamba2AttentionMetadata.prep_initial_states", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Mamba2AttentionMetadata.chunk_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Mamba2AttentionMetadata.seq_idx_p", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.mamba2_attn.Mamba2AttentionMetadataBuilder", "methods": [ { "kind": "function", "name": "Mamba2AttentionMetadataBuilder.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Mamba2AttentionMetadataBuilder.build", "n_typed": 4, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Mamba2AttentionMetadataBuilder.metadata_cls", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Mamba2AttentionMetadataBuilder.chunk_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 11, "n_typed": 9, "n_any": 1, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 2, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.attention.backends.mamba2_attn.compute_varlen_chunk_metadata", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.v1.attention.backends.mamba2_attn", "names": [ "vllm.v1.attention.backends.mamba2_attn.Mamba2AttentionBackend", "vllm.v1.attention.backends.mamba2_attn.Mamba2AttentionMetadata", "vllm.v1.attention.backends.mamba2_attn.Mamba2AttentionMetadataBuilder", "vllm.v1.attention.backends.mamba2_attn.compute_varlen_chunk_metadata" ], "n_typable": 16, "n_typed": 14, "n_any": 1, "n_untyped": 1, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_classes": 3, "n_attrs": 5, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/backends/mamba_attn.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.attention.backends.mamba_attn.BaseMambaAttentionMetadataBuilder", "methods": [ { "kind": "function", "name": "BaseMambaAttentionMetadataBuilder.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BaseMambaAttentionMetadataBuilder.build_for_cudagraph_capture", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseMambaAttentionMetadataBuilder.build", "n_typed": 5, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "BaseMambaAttentionMetadataBuilder._compute_chunk_metadata", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BaseMambaAttentionMetadataBuilder._build_chunk_metadata_tensors", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BaseMambaAttentionMetadataBuilder._compute_prefix_caching_block_indices", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseMambaAttentionMetadataBuilder._compute_common_metadata", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseMambaAttentionMetadataBuilder._update_metadata_for_cudagraph_capture", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseMambaAttentionMetadataBuilder.update_block_table", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BaseMambaAttentionMetadataBuilder.metadata_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BaseMambaAttentionMetadataBuilder.reorder_batch_threshold", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BaseMambaAttentionMetadataBuilder._cudagraph_support", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BaseMambaAttentionMetadataBuilder.supports_update_block_table", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BaseMambaAttentionMetadataBuilder.speculative_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseMambaAttentionMetadataBuilder.compilation_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseMambaAttentionMetadataBuilder.num_spec_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BaseMambaAttentionMetadataBuilder.use_spec_decode", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseMambaAttentionMetadataBuilder.decode_cudagraph_max_bs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseMambaAttentionMetadataBuilder.state_indices_tensor_d", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseMambaAttentionMetadataBuilder.block_idx_last_scheduled_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseMambaAttentionMetadataBuilder.block_idx_last_computed_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseMambaAttentionMetadataBuilder.decode_num_accepted_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 47, "n_typed": 37, "n_any": 1, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 25, "n_attrs": 13, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.mamba_attn.BaseMambaAttentionMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "BaseMambaAttentionMetadata.num_prefills", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BaseMambaAttentionMetadata.num_prefill_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BaseMambaAttentionMetadata.num_decodes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BaseMambaAttentionMetadata.num_decode_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BaseMambaAttentionMetadata.num_reqs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BaseMambaAttentionMetadata.has_initial_states_p", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BaseMambaAttentionMetadata.query_start_loc_p", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BaseMambaAttentionMetadata.num_computed_tokens_p", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BaseMambaAttentionMetadata.state_indices_tensor_p", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BaseMambaAttentionMetadata.state_indices_tensor_d", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BaseMambaAttentionMetadata.query_start_loc_d", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BaseMambaAttentionMetadata.num_accepted_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BaseMambaAttentionMetadata.block_idx_last_scheduled_token", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BaseMambaAttentionMetadata.block_idx_first_scheduled_token_p", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BaseMambaAttentionMetadata.block_idx_last_computed_token", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BaseMambaAttentionMetadata.seq_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BaseMambaAttentionMetadata.cu_chunk_seqlen_p", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BaseMambaAttentionMetadata.last_chunk_indices_p", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BaseMambaAttentionMetadata.nums_dict", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BaseMambaAttentionMetadata.batch_ptr", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BaseMambaAttentionMetadata.token_chunk_offset_ptr", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 21, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.attention.backends.mamba_attn.M", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.v1.attention.backends.mamba_attn", "names": [ "vllm.v1.attention.backends.mamba_attn.BaseMambaAttentionMetadata", "vllm.v1.attention.backends.mamba_attn.BaseMambaAttentionMetadataBuilder", "vllm.v1.attention.backends.mamba_attn.M" ], "n_typable": 47, "n_typed": 37, "n_any": 1, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 25, "n_classes": 2, "n_attrs": 35, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/backends/mla/aiter_triton_mla.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.attention.backends.mla.aiter_triton_mla.AiterTritonMLAImpl", "methods": [ { "kind": "function", "name": "AiterTritonMLAImpl.__init__", "n_typed": 11, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "AiterTritonMLAImpl._flash_attn_varlen_diff_headdims", "n_typed": 0, "n_any": 0, "n_untyped": 7, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AiterTritonMLAImpl.flash_attn_varlen_func", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 11, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 17, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.aiter_triton_mla.AiterTritonMLABackend", "methods": [ { "kind": "function", "name": "AiterTritonMLABackend.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AiterTritonMLABackend.get_impl_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.attention.backends.mla.aiter_triton_mla", "names": [ "vllm.v1.attention.backends.mla.aiter_triton_mla.AiterTritonMLABackend", "vllm.v1.attention.backends.mla.aiter_triton_mla.AiterTritonMLAImpl" ], "n_typable": 22, "n_typed": 13, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 17, "n_classes": 2, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/backends/mla/cutlass_mla.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.attention.backends.mla.cutlass_mla.CutlassMLAMetadataBuilder", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "CutlassMLAMetadataBuilder._cudagraph_support", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.attention.backends.mla.cutlass_mla.MAX_HEADS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.v1.attention.backends.mla.cutlass_mla.g_sm100_workspace", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.cutlass_mla.SM100Workspace", "methods": [ { "kind": "function", "name": "SM100Workspace.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SM100Workspace.get_buf", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SM100Workspace.ensure_size", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 2, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.cutlass_mla.CutlassMLABackend", "methods": [ { "kind": "function", "name": "CutlassMLABackend.get_supported_kernel_block_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CutlassMLABackend.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CutlassMLABackend.get_impl_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CutlassMLABackend.get_builder_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CutlassMLABackend.supports_compute_capability", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CutlassMLABackend.supported_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CutlassMLABackend.supported_kv_cache_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 8, "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 1, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.attention.backends.mla.cutlass_mla.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.cutlass_mla.CutlassMLAImpl", "methods": [ { "kind": "function", "name": "CutlassMLAImpl.__init__", "n_typed": 11, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "CutlassMLAImpl._sm100_cutlass_mla_decode", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "CutlassMLAImpl.forward_mqa", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CutlassMLAImpl.can_return_lse_for_decode", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 27, "n_typed": 26, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 23, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.attention.backends.mla.cutlass_mla", "names": [ "vllm.v1.attention.backends.mla.cutlass_mla.CutlassMLABackend", "vllm.v1.attention.backends.mla.cutlass_mla.CutlassMLAImpl", "vllm.v1.attention.backends.mla.cutlass_mla.CutlassMLAMetadataBuilder", "vllm.v1.attention.backends.mla.cutlass_mla.MAX_HEADS", "vllm.v1.attention.backends.mla.cutlass_mla.SM100Workspace", "vllm.v1.attention.backends.mla.cutlass_mla.g_sm100_workspace", "vllm.v1.attention.backends.mla.cutlass_mla.logger" ], "n_typable": 44, "n_typed": 37, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 27, "n_classes": 4, "n_attrs": 7, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/backends/mla/flashattn_mla.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.attention.backends.mla.flashattn_mla.FlashAttnMLADecodeMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashAttnMLADecodeMetadata.query_start_loc", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashAttnMLADecodeMetadata.max_query_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashAttnMLADecodeMetadata.max_seq_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashAttnMLADecodeMetadata.scheduler_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashAttnMLADecodeMetadata.max_num_splits", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.flashattn_mla.FlashAttnMLABackend", "methods": [ { "kind": "function", "name": "FlashAttnMLABackend.get_supported_kernel_block_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashAttnMLABackend.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashAttnMLABackend.get_builder_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashAttnMLABackend.get_impl_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashAttnMLABackend.supports_compute_capability", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlashAttnMLABackend.supports_combination", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashAttnMLABackend.supported_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttnMLABackend.supported_kv_cache_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 17, "n_typed": 17, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 9, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.flashattn_mla.FlashAttnMLAImpl", "methods": [ { "kind": "function", "name": "FlashAttnMLAImpl.__init__", "n_typed": 11, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "FlashAttnMLAImpl.forward_mqa", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashAttnMLAImpl.can_return_lse_for_decode", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 18, "n_typed": 17, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 15, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.flashattn_mla.FlashAttnMLAMetadataBuilder", "methods": [ { "kind": "function", "name": "FlashAttnMLAMetadataBuilder.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FlashAttnMLAMetadataBuilder._schedule_decode", "n_typed": 0, "n_any": 0, "n_untyped": 8, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "FlashAttnMLAMetadataBuilder._build_decode", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashAttnMLAMetadataBuilder._cudagraph_support", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttnMLAMetadataBuilder.query_len_support", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttnMLAMetadataBuilder.reorder_batch_threshold", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttnMLAMetadataBuilder.max_num_splits", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttnMLAMetadataBuilder.fa_aot_schedule", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttnMLAMetadataBuilder.use_full_cuda_graph", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttnMLAMetadataBuilder.max_cudagraph_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttnMLAMetadataBuilder.scheduler_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 29, "n_typed": 15, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 18, "n_attrs": 8, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.attention.backends.mla.flashattn_mla.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.flashattn_mla.FlashAttnMLAMetadata", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.attention.backends.mla.flashattn_mla", "names": [ "vllm.v1.attention.backends.mla.flashattn_mla.FlashAttnMLABackend", "vllm.v1.attention.backends.mla.flashattn_mla.FlashAttnMLADecodeMetadata", "vllm.v1.attention.backends.mla.flashattn_mla.FlashAttnMLAImpl", "vllm.v1.attention.backends.mla.flashattn_mla.FlashAttnMLAMetadata", "vllm.v1.attention.backends.mla.flashattn_mla.FlashAttnMLAMetadataBuilder", "vllm.v1.attention.backends.mla.flashattn_mla.logger" ], "n_typable": 65, "n_typed": 49, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 42, "n_classes": 5, "n_attrs": 17, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/backends/mla/flashinfer_mla.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.attention.backends.mla.flashinfer_mla.FlashInferMLAMetadataBuilder", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashInferMLAMetadataBuilder._cudagraph_support", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMLAMetadataBuilder.query_len_support", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.flashinfer_mla.FlashInferMLAImpl", "methods": [ { "kind": "function", "name": "FlashInferMLAImpl.__init__", "n_typed": 11, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "FlashInferMLAImpl.forward_mqa", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashInferMLAImpl.bmm1_scale", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMLAImpl.bmm2_scale", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 19, "n_typed": 18, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 15, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.flashinfer_mla.FlashInferMLABackend", "methods": [ { "kind": "function", "name": "FlashInferMLABackend.get_supported_kernel_block_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashInferMLABackend.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashInferMLABackend.get_impl_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashInferMLABackend.get_builder_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashInferMLABackend.supports_compute_capability", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlashInferMLABackend.supports_combination", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "FlashInferMLABackend.get_required_kv_cache_layout", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashInferMLABackend.supported_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMLABackend.supported_kv_cache_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 18, "n_typed": 18, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 9, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.attention.backends.mla.flashinfer_mla.FLASHINFER_MLA_WORKSPACE_BUFFER_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.v1.attention.backends.mla.flashinfer_mla.g_fi_workspace", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.v1.attention.backends.mla.flashinfer_mla.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.v1.attention.backends.mla.flashinfer_mla", "names": [ "vllm.v1.attention.backends.mla.flashinfer_mla.FLASHINFER_MLA_WORKSPACE_BUFFER_SIZE", "vllm.v1.attention.backends.mla.flashinfer_mla.FlashInferMLABackend", "vllm.v1.attention.backends.mla.flashinfer_mla.FlashInferMLAImpl", "vllm.v1.attention.backends.mla.flashinfer_mla.FlashInferMLAMetadataBuilder", "vllm.v1.attention.backends.mla.flashinfer_mla.g_fi_workspace", "vllm.v1.attention.backends.mla.flashinfer_mla.logger" ], "n_typable": 41, "n_typed": 38, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 24, "n_classes": 3, "n_attrs": 9, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/backends/mla/flashinfer_mla_sparse.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.attention.backends.mla.flashinfer_mla_sparse.FlashInferMLASparseBackend", "methods": [ { "kind": "function", "name": "FlashInferMLASparseBackend.get_supported_kernel_block_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashInferMLASparseBackend.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashInferMLASparseBackend.get_impl_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashInferMLASparseBackend.get_builder_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashInferMLASparseBackend.get_supported_head_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashInferMLASparseBackend.is_mla", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashInferMLASparseBackend.is_sparse", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashInferMLASparseBackend.supports_compute_capability", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlashInferMLASparseBackend.supports_combination", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "FlashInferMLASparseBackend.get_kv_cache_shape", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "FlashInferMLASparseBackend.get_required_kv_cache_layout", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashInferMLASparseBackend.accept_output_buffer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMLASparseBackend.supported_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMLASparseBackend.supported_kv_cache_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 28, "n_typed": 28, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 14, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.attention.backends.mla.flashinfer_mla_sparse.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.flashinfer_mla_sparse.FlashInferMLASparseImpl", "methods": [ { "kind": "function", "name": "FlashInferMLASparseImpl.__init__", "n_typed": 13, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 }, { "kind": "function", "name": "FlashInferMLASparseImpl.forward_mqa", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashInferMLASparseImpl.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMLASparseImpl.head_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMLASparseImpl.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMLASparseImpl.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMLASparseImpl.kv_cache_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMLASparseImpl.kv_lora_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMLASparseImpl.qk_nope_head_dim", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMLASparseImpl.qk_rope_head_dim", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMLASparseImpl.topk_indices_buffer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMLASparseImpl.bmm1_scale", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMLASparseImpl.bmm2_scale", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 30, "n_typed": 24, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 17, "n_attrs": 11, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.flashinfer_mla_sparse.FlashInferMLASparseMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashInferMLASparseMetadata.num_reqs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashInferMLASparseMetadata.max_query_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashInferMLASparseMetadata.max_seq_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashInferMLASparseMetadata.num_actual_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashInferMLASparseMetadata.query_start_loc", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashInferMLASparseMetadata.slot_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashInferMLASparseMetadata.block_table", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashInferMLASparseMetadata.req_id_per_token", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashInferMLASparseMetadata.seq_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashInferMLASparseMetadata.block_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashInferMLASparseMetadata.topk_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 11, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.attention.backends.mla.flashinfer_mla_sparse.FLASHINFER_MLA_SPARSE_WORKSPACE_BUFFER_SIZE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.flashinfer_mla_sparse.FlashInferMLASparseMetadataBuilder", "methods": [ { "kind": "function", "name": "FlashInferMLASparseMetadataBuilder.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FlashInferMLASparseMetadataBuilder.build", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashInferMLASparseMetadataBuilder._cudagraph_support", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMLASparseMetadataBuilder.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMLASparseMetadataBuilder.layer_names", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMLASparseMetadataBuilder.kv_cache_spec", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMLASparseMetadataBuilder.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMLASparseMetadataBuilder.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMLASparseMetadataBuilder.mla_dims", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMLASparseMetadataBuilder.topk_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashInferMLASparseMetadataBuilder.req_id_per_token_buffer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 10, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 9, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.attention.backends.mla.flashinfer_mla_sparse", "names": [ "vllm.v1.attention.backends.mla.flashinfer_mla_sparse.FLASHINFER_MLA_SPARSE_WORKSPACE_BUFFER_SIZE", "vllm.v1.attention.backends.mla.flashinfer_mla_sparse.FlashInferMLASparseBackend", "vllm.v1.attention.backends.mla.flashinfer_mla_sparse.FlashInferMLASparseImpl", "vllm.v1.attention.backends.mla.flashinfer_mla_sparse.FlashInferMLASparseMetadata", "vllm.v1.attention.backends.mla.flashinfer_mla_sparse.FlashInferMLASparseMetadataBuilder", "vllm.v1.attention.backends.mla.flashinfer_mla_sparse.logger" ], "n_typable": 77, "n_typed": 62, "n_any": 0, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 38, "n_classes": 4, "n_attrs": 36, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/backends/mla/flashmla.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.attention.backends.mla.flashmla.FlashMLADecodeMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashMLADecodeMetadata.scheduler_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.flashmla.FlashMLABackend", "methods": [ { "kind": "function", "name": "FlashMLABackend.get_supported_kernel_block_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashMLABackend.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashMLABackend.get_builder_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashMLABackend.get_impl_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashMLABackend.supports_compute_capability", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlashMLABackend.supports_combination", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashMLABackend.supported_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashMLABackend.supported_kv_cache_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 17, "n_typed": 17, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 9, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.flashmla.FlashMLAImpl", "methods": [ { "kind": "function", "name": "FlashMLAImpl.__init__", "n_typed": 11, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "FlashMLAImpl.forward_mqa", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashMLAImpl.can_return_lse_for_decode", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 18, "n_typed": 17, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 15, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.flashmla.FlashMLAMetadataBuilder", "methods": [ { "kind": "function", "name": "FlashMLAMetadataBuilder.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FlashMLAMetadataBuilder._build_decode", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashMLAMetadataBuilder._cudagraph_support", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashMLAMetadataBuilder.query_len_support", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashMLAMetadataBuilder.reorder_batch_threshold", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashMLAMetadataBuilder.num_q_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashMLAMetadataBuilder.cg_buf_tile_scheduler_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashMLAMetadataBuilder.cg_buf_num_splits", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashMLAMetadataBuilder.is_fp8_kvcache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 20, "n_typed": 15, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 11, "n_attrs": 7, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.attention.backends.mla.flashmla.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.flashmla.FlashMLAMetadata", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.attention.backends.mla.flashmla", "names": [ "vllm.v1.attention.backends.mla.flashmla.FlashMLABackend", "vllm.v1.attention.backends.mla.flashmla.FlashMLADecodeMetadata", "vllm.v1.attention.backends.mla.flashmla.FlashMLAImpl", "vllm.v1.attention.backends.mla.flashmla.FlashMLAMetadata", "vllm.v1.attention.backends.mla.flashmla.FlashMLAMetadataBuilder", "vllm.v1.attention.backends.mla.flashmla.logger" ], "n_typable": 56, "n_typed": 49, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 35, "n_classes": 5, "n_attrs": 12, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/backends/mla/flashmla_sparse.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.attention.backends.mla.flashmla_sparse.Decode", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Decode.kernel_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Decode.decode_query_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.flashmla_sparse.FlashMLASparseBackend", "methods": [ { "kind": "function", "name": "FlashMLASparseBackend.get_supported_kernel_block_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashMLASparseBackend.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashMLASparseBackend.get_builder_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashMLASparseBackend.get_impl_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashMLASparseBackend.get_supported_head_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashMLASparseBackend.is_mla", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashMLASparseBackend.is_sparse", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashMLASparseBackend.supports_compute_capability", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlashMLASparseBackend.get_kv_cache_shape", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashMLASparseBackend.accept_output_buffer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashMLASparseBackend.supported_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashMLASparseBackend.supported_kv_cache_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 18, "n_typed": 18, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 6, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.flashmla_sparse.Prefill", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Prefill.seq_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Prefill.request_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Prefill.workspace_starts", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Prefill.chunks", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.flashmla_sparse.FlashMLASparseMetadataBuilder", "methods": [ { "kind": "function", "name": "FlashMLASparseMetadataBuilder.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FlashMLASparseMetadataBuilder._build_fp8_mixed_decode_prefill", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlashMLASparseMetadataBuilder._build_fp8_separate_prefill_decode", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlashMLASparseMetadataBuilder.build", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashMLASparseMetadataBuilder._cudagraph_support", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashMLASparseMetadataBuilder.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashMLASparseMetadataBuilder.layer_names", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashMLASparseMetadataBuilder.kv_cache_spec", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashMLASparseMetadataBuilder.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashMLASparseMetadataBuilder.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashMLASparseMetadataBuilder.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashMLASparseMetadataBuilder.mla_dims", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashMLASparseMetadataBuilder.fp8_decode_padded_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashMLASparseMetadataBuilder.topk_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashMLASparseMetadataBuilder.use_fp8_kv_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashMLASparseMetadataBuilder.topk_tokens_tensor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashMLASparseMetadataBuilder.max_model_len_tensor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashMLASparseMetadataBuilder.dummy_block_table", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashMLASparseMetadataBuilder.tile_scheduler_metadata_buffer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashMLASparseMetadataBuilder.num_splits_buffer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashMLASparseMetadataBuilder.req_id_per_token_buffer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 30, "n_typed": 14, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 9, "n_attrs": 17, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.flashmla_sparse.FlashMLASparseImpl", "methods": [ { "kind": "function", "name": "FlashMLASparseImpl._compute_fp8_decode_padded_heads", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlashMLASparseImpl.__init__", "n_typed": 13, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 }, { "kind": "function", "name": "FlashMLASparseImpl._forward_bf16_kv", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FlashMLASparseImpl._forward_fp8_kv_separate_prefill_decode", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FlashMLASparseImpl._forward_fp8_kv_mixed_batch", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FlashMLASparseImpl._fp8_flash_mla_kernel", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FlashMLASparseImpl._bf16_flash_mla_kernel", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "FlashMLASparseImpl.forward_mqa", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashMLASparseImpl.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashMLASparseImpl.head_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashMLASparseImpl.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashMLASparseImpl.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashMLASparseImpl.kv_cache_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashMLASparseImpl.kv_lora_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashMLASparseImpl.softmax_scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashMLASparseImpl.topk_indices_buffer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashMLASparseImpl.prefill_padding", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashMLASparseImpl.fp8_decode_padded_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashMLASparseImpl.prefill_workspace_shape", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 56, "n_typed": 46, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 37, "n_attrs": 11, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.flashmla_sparse.Chunk", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Chunk.seq_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Chunk.tokens_slice", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Chunk.block_table", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Chunk.req_start_idx", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Chunk.workspace_starts", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Chunk.chunk_tot_seqlen", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.flashmla_sparse.FlashMLASparseMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashMLASparseMetadata.num_reqs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashMLASparseMetadata.max_query_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashMLASparseMetadata.max_seq_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashMLASparseMetadata.num_actual_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashMLASparseMetadata.query_start_loc", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashMLASparseMetadata.slot_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashMLASparseMetadata.block_table", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashMLASparseMetadata.req_id_per_token", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashMLASparseMetadata.block_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashMLASparseMetadata.topk_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashMLASparseMetadata.fp8_extra_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashMLASparseMetadata.fp8_use_mixed_batch", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 12, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.flashmla_sparse.FP8KernelMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "FP8KernelMetadata.scheduler_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FP8KernelMetadata.dummy_block_table", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FP8KernelMetadata.cache_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.attention.backends.mla.flashmla_sparse.get_prefill_workspace_size", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.v1.attention.backends.mla.flashmla_sparse.MIN_HEADS_FOR_BF16_PREFILL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.flashmla_sparse.FP8SeparatePrefillDecode", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "FP8SeparatePrefillDecode.num_prefills", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FP8SeparatePrefillDecode.num_decodes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FP8SeparatePrefillDecode.num_prefill_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FP8SeparatePrefillDecode.num_decode_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FP8SeparatePrefillDecode.decode", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FP8SeparatePrefillDecode.prefill", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 6, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.attention.backends.mla.flashmla_sparse.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.v1.attention.backends.mla.flashmla_sparse", "names": [ "vllm.v1.attention.backends.mla.flashmla_sparse.Chunk", "vllm.v1.attention.backends.mla.flashmla_sparse.Decode", "vllm.v1.attention.backends.mla.flashmla_sparse.FP8KernelMetadata", "vllm.v1.attention.backends.mla.flashmla_sparse.FP8SeparatePrefillDecode", "vllm.v1.attention.backends.mla.flashmla_sparse.FlashMLASparseBackend", "vllm.v1.attention.backends.mla.flashmla_sparse.FlashMLASparseImpl", "vllm.v1.attention.backends.mla.flashmla_sparse.FlashMLASparseMetadata", "vllm.v1.attention.backends.mla.flashmla_sparse.FlashMLASparseMetadataBuilder", "vllm.v1.attention.backends.mla.flashmla_sparse.MIN_HEADS_FOR_BF16_PREFILL", "vllm.v1.attention.backends.mla.flashmla_sparse.Prefill", "vllm.v1.attention.backends.mla.flashmla_sparse.get_prefill_workspace_size", "vllm.v1.attention.backends.mla.flashmla_sparse.logger" ], "n_typable": 107, "n_typed": 79, "n_any": 0, "n_untyped": 28, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 21, "n_method_overloads": 21, "n_method_params": 52, "n_classes": 9, "n_attrs": 66, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/backends/mla/indexer.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.v1.attention.backends.mla.indexer.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.indexer.DeepseekV32IndexerMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "DeepseekV32IndexerMetadata.seq_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeepseekV32IndexerMetadata.num_reqs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeepseekV32IndexerMetadata.max_query_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeepseekV32IndexerMetadata.max_seq_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeepseekV32IndexerMetadata.num_actual_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeepseekV32IndexerMetadata.query_start_loc", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeepseekV32IndexerMetadata.slot_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeepseekV32IndexerMetadata.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeepseekV32IndexerMetadata.num_decodes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeepseekV32IndexerMetadata.num_decode_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeepseekV32IndexerMetadata.num_prefills", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeepseekV32IndexerMetadata.num_prefill_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeepseekV32IndexerMetadata.decode", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeepseekV32IndexerMetadata.prefill", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 14, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.indexer.DeepseekV32IndexerPrefillChunkMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "DeepseekV32IndexerPrefillChunkMetadata.block_table", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeepseekV32IndexerPrefillChunkMetadata.cu_seqlen_ks", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeepseekV32IndexerPrefillChunkMetadata.cu_seqlen_ke", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeepseekV32IndexerPrefillChunkMetadata.cu_seq_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeepseekV32IndexerPrefillChunkMetadata.token_to_seq", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeepseekV32IndexerPrefillChunkMetadata.total_seq_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeepseekV32IndexerPrefillChunkMetadata.token_start", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeepseekV32IndexerPrefillChunkMetadata.token_end", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeepseekV32IndexerPrefillChunkMetadata.num_reqs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 9, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.attention.backends.mla.indexer.kv_spans_from_batches", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.v1.attention.backends.mla.indexer.get_max_prefill_buffer_size", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.indexer.DeepseekV32IndexerPrefillMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "DeepseekV32IndexerPrefillMetadata.chunks", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.indexer.DeepSeekV32IndexerDecodeMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "DeepSeekV32IndexerDecodeMetadata.block_table", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeepSeekV32IndexerDecodeMetadata.seq_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeepSeekV32IndexerDecodeMetadata.decode_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeepSeekV32IndexerDecodeMetadata.requires_padding", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeepSeekV32IndexerDecodeMetadata.schedule_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeepSeekV32IndexerDecodeMetadata.use_large_context_topk", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DeepSeekV32IndexerDecodeMetadata.offsets", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.indexer.DeepseekV32IndexerMetadataBuilder", "methods": [ { "kind": "function", "name": "DeepseekV32IndexerMetadataBuilder.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DeepseekV32IndexerMetadataBuilder.build_one_prefill_chunk", "n_typed": 0, "n_any": 0, "n_untyped": 6, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "DeepseekV32IndexerMetadataBuilder.build", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DeepseekV32IndexerMetadataBuilder._cudagraph_support", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV32IndexerMetadataBuilder.reorder_batch_threshold", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV32IndexerMetadataBuilder.max_prefill_buffer_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV32IndexerMetadataBuilder.num_speculative_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV32IndexerMetadataBuilder.num_sms", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV32IndexerMetadataBuilder.decode_lens_buffer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV32IndexerMetadataBuilder.arange_buffer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV32IndexerMetadataBuilder.expanded_seq_lens_buffer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV32IndexerMetadataBuilder.expanded_block_table_buffer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DeepseekV32IndexerMetadataBuilder.scheduler_metadata_buffer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 23, "n_typed": 6, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 10, "n_attrs": 10, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.indexer.DeepseekV32IndexerBackend", "methods": [ { "kind": "function", "name": "DeepseekV32IndexerBackend.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeepseekV32IndexerBackend.get_supported_kernel_block_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeepseekV32IndexerBackend.get_supported_head_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeepseekV32IndexerBackend.get_builder_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DeepseekV32IndexerBackend.get_kv_cache_shape", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "DeepseekV32IndexerBackend.get_kv_cache_stride_order", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 6, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.attention.backends.mla.indexer", "names": [ "vllm.v1.attention.backends.mla.indexer.DeepSeekV32IndexerDecodeMetadata", "vllm.v1.attention.backends.mla.indexer.DeepseekV32IndexerBackend", "vllm.v1.attention.backends.mla.indexer.DeepseekV32IndexerMetadata", "vllm.v1.attention.backends.mla.indexer.DeepseekV32IndexerMetadataBuilder", "vllm.v1.attention.backends.mla.indexer.DeepseekV32IndexerPrefillChunkMetadata", "vllm.v1.attention.backends.mla.indexer.DeepseekV32IndexerPrefillMetadata", "vllm.v1.attention.backends.mla.indexer.get_max_prefill_buffer_size", "vllm.v1.attention.backends.mla.indexer.kv_spans_from_batches", "vllm.v1.attention.backends.mla.indexer.logger" ], "n_typable": 42, "n_typed": 23, "n_any": 0, "n_untyped": 19, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 4, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 16, "n_classes": 6, "n_attrs": 42, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/backends/mla/rocm_aiter_mla.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.attention.backends.mla.rocm_aiter_mla.AiterMLADecodeMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "AiterMLADecodeMetadata.paged_kv_indptr", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterMLADecodeMetadata.paged_kv_indices", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterMLADecodeMetadata.paged_kv_last_page_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterMLADecodeMetadata.qo_indptr", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterMLADecodeMetadata.attn_out_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterMLADecodeMetadata.max_qo_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.rocm_aiter_mla.AiterMLAImpl", "methods": [ { "kind": "function", "name": "AiterMLAImpl.__init__", "n_typed": 11, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "AiterMLAImpl._flash_attn_varlen_diff_headdims", "n_typed": 0, "n_any": 0, "n_untyped": 7, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "AiterMLAImpl.forward_mqa", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AiterMLAImpl.flash_attn_varlen_func", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 25, "n_typed": 16, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 21, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.rocm_aiter_mla.AiterMLABackend", "methods": [ { "kind": "function", "name": "AiterMLABackend.get_supported_kernel_block_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AiterMLABackend.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AiterMLABackend.get_impl_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AiterMLABackend.get_builder_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.rocm_aiter_mla.AiterMLAMetadataBuilder", "methods": [ { "kind": "function", "name": "AiterMLAMetadataBuilder.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "AiterMLAMetadataBuilder._build_decode", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AiterMLAMetadataBuilder._cudagraph_support", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AiterMLAMetadataBuilder.query_len_support", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AiterMLAMetadataBuilder.compilation_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AiterMLAMetadataBuilder.decode_attn_out_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AiterMLAMetadataBuilder.paged_kv_last_page_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AiterMLAMetadataBuilder.paged_kv_indptr", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AiterMLAMetadataBuilder.paged_kv_indices", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AiterMLAMetadataBuilder.qo_indptr", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 14, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 11, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.rocm_aiter_mla.AiterMLAMetadata", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.attention.backends.mla.rocm_aiter_mla", "names": [ "vllm.v1.attention.backends.mla.rocm_aiter_mla.AiterMLABackend", "vllm.v1.attention.backends.mla.rocm_aiter_mla.AiterMLADecodeMetadata", "vllm.v1.attention.backends.mla.rocm_aiter_mla.AiterMLAImpl", "vllm.v1.attention.backends.mla.rocm_aiter_mla.AiterMLAMetadata", "vllm.v1.attention.backends.mla.rocm_aiter_mla.AiterMLAMetadataBuilder" ], "n_typable": 50, "n_typed": 34, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 32, "n_classes": 5, "n_attrs": 15, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/backends/mla/rocm_aiter_mla_sparse.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.v1.attention.backends.mla.rocm_aiter_mla_sparse.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.rocm_aiter_mla_sparse.ROCMAiterMLASparseBackend", "methods": [ { "kind": "function", "name": "ROCMAiterMLASparseBackend.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ROCMAiterMLASparseBackend.get_metadata_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ROCMAiterMLASparseBackend.get_builder_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ROCMAiterMLASparseBackend.get_impl_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ROCMAiterMLASparseBackend.get_kv_cache_shape", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "ROCMAiterMLASparseBackend.get_supported_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ROCMAiterMLASparseBackend.get_supported_head_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ROCMAiterMLASparseBackend.accept_output_buffer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 13, "n_typed": 13, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 5, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.attention.backends.mla.rocm_aiter_mla_sparse.fetch_id_to_ragged_kernel", "n_typed": 3, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "vllm.v1.attention.backends.mla.rocm_aiter_mla_sparse.fetch_id_to_ragged_triton", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.rocm_aiter_mla_sparse.ROCMAiterMLASparseMetadataBuilder", "methods": [ { "kind": "function", "name": "ROCMAiterMLASparseMetadataBuilder.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ROCMAiterMLASparseMetadataBuilder.build", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ROCMAiterMLASparseMetadataBuilder._cudagraph_support", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 9, "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.attention.backends.mla.rocm_aiter_mla_sparse.reference_mla_sparse_prefill", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.rocm_aiter_mla_sparse.ROCMAiterMLASparseImpl", "methods": [ { "kind": "function", "name": "ROCMAiterMLASparseImpl.__init__", "n_typed": 13, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 }, { "kind": "function", "name": "ROCMAiterMLASparseImpl._forward_bf16_kv", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ROCMAiterMLASparseImpl.forward_mqa", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ROCMAiterMLASparseImpl.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ROCMAiterMLASparseImpl.head_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ROCMAiterMLASparseImpl.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ROCMAiterMLASparseImpl.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ROCMAiterMLASparseImpl.kv_cache_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ROCMAiterMLASparseImpl.kv_lora_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ROCMAiterMLASparseImpl.softmax_scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ROCMAiterMLASparseImpl.topk_indices_buffer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 32, "n_typed": 25, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 21, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.rocm_aiter_mla_sparse.ROCMAiterMLASparseMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ROCMAiterMLASparseMetadata.num_reqs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ROCMAiterMLASparseMetadata.max_query_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ROCMAiterMLASparseMetadata.max_seq_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ROCMAiterMLASparseMetadata.num_actual_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ROCMAiterMLASparseMetadata.query_start_loc", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ROCMAiterMLASparseMetadata.slot_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ROCMAiterMLASparseMetadata.block_table", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ROCMAiterMLASparseMetadata.req_id_per_token", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ROCMAiterMLASparseMetadata.qo_indptr", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ROCMAiterMLASparseMetadata.paged_kv_last_page_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ROCMAiterMLASparseMetadata.paged_kv_indices", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ROCMAiterMLASparseMetadata.paged_kv_indptr", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ROCMAiterMLASparseMetadata.paged_kv_indptr_rest", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ROCMAiterMLASparseMetadata.block_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ROCMAiterMLASparseMetadata.topk_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 15, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.attention.backends.mla.rocm_aiter_mla_sparse", "names": [ "vllm.v1.attention.backends.mla.rocm_aiter_mla_sparse.ROCMAiterMLASparseBackend", "vllm.v1.attention.backends.mla.rocm_aiter_mla_sparse.ROCMAiterMLASparseImpl", "vllm.v1.attention.backends.mla.rocm_aiter_mla_sparse.ROCMAiterMLASparseMetadata", "vllm.v1.attention.backends.mla.rocm_aiter_mla_sparse.ROCMAiterMLASparseMetadataBuilder", "vllm.v1.attention.backends.mla.rocm_aiter_mla_sparse.fetch_id_to_ragged_kernel", "vllm.v1.attention.backends.mla.rocm_aiter_mla_sparse.fetch_id_to_ragged_triton", "vllm.v1.attention.backends.mla.rocm_aiter_mla_sparse.logger", "vllm.v1.attention.backends.mla.rocm_aiter_mla_sparse.reference_mla_sparse_prefill" ], "n_typable": 74, "n_typed": 58, "n_any": 0, "n_untyped": 16, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 16, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 33, "n_classes": 4, "n_attrs": 26, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/backends/mla/sparse_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.attention.backends.mla.sparse_utils.triton_convert_req_index_to_global_index", "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 } ], "type_ignores": [], "name": "vllm.v1.attention.backends.mla.sparse_utils", "names": [ "vllm.v1.attention.backends.mla.sparse_utils.triton_convert_req_index_to_global_index" ], "n_typable": 11, "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 10, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/backends/mla/triton_mla.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.v1.attention.backends.mla.triton_mla.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.triton_mla.TritonMLABackend", "methods": [ { "kind": "function", "name": "TritonMLABackend.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TritonMLABackend.get_impl_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TritonMLABackend.supports_compute_capability", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TritonMLABackend.supported_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TritonMLABackend.supported_kv_cache_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 1, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.mla.triton_mla.TritonMLAImpl", "methods": [ { "kind": "function", "name": "TritonMLAImpl.__init__", "n_typed": 11, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "TritonMLAImpl._flash_attn_varlen_diff_headdims", "n_typed": 0, "n_any": 0, "n_untyped": 7, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "TritonMLAImpl.forward_mqa", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TritonMLAImpl.can_return_lse_for_decode", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 25, "n_typed": 17, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 21, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.attention.backends.mla.triton_mla", "names": [ "vllm.v1.attention.backends.mla.triton_mla.TritonMLABackend", "vllm.v1.attention.backends.mla.triton_mla.TritonMLAImpl", "vllm.v1.attention.backends.mla.triton_mla.logger" ], "n_typable": 32, "n_typed": 23, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 22, "n_classes": 2, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/backends/registry.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.v1.attention.backends.registry.MAMBA_TYPE_TO_BACKEND_MAP", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.registry.AttentionBackendEnum", "methods": [ { "kind": "function", "name": "AttentionBackendEnum.get_path", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AttentionBackendEnum.get_class", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AttentionBackendEnum.is_overridden", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AttentionBackendEnum.clear_override", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AttentionBackendEnum.FLASH_ATTN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionBackendEnum.FLASH_ATTN_DIFFKV", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionBackendEnum.TRITON_ATTN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionBackendEnum.ROCM_ATTN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionBackendEnum.ROCM_AITER_MLA", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionBackendEnum.ROCM_AITER_TRITON_MLA", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionBackendEnum.ROCM_AITER_FA", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionBackendEnum.ROCM_AITER_MLA_SPARSE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionBackendEnum.TORCH_SDPA", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionBackendEnum.FLASHINFER", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionBackendEnum.FLASHINFER_MLA", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionBackendEnum.FLASHINFER_MLA_SPARSE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionBackendEnum.TRITON_MLA", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionBackendEnum.CUTLASS_MLA", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionBackendEnum.FLASHMLA", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionBackendEnum.FLASHMLA_SPARSE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionBackendEnum.FLASH_ATTN_MLA", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionBackendEnum.NO_ATTENTION", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionBackendEnum.FLEX_ATTENTION", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionBackendEnum.TREE_ATTN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionBackendEnum.ROCM_AITER_UNIFIED_ATTN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionBackendEnum.CPU_ATTN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionBackendEnum.CUSTOM", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 1, "n_attrs": 23, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.attention.backends.registry.register_backend", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.v1.attention.backends.registry.MambaAttentionBackendEnum", "methods": [ { "kind": "function", "name": "MambaAttentionBackendEnum.get_path", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MambaAttentionBackendEnum.get_class", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MambaAttentionBackendEnum.is_overridden", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MambaAttentionBackendEnum.clear_override", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MambaAttentionBackendEnum.MAMBA1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MambaAttentionBackendEnum.MAMBA2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MambaAttentionBackendEnum.SHORT_CONV", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MambaAttentionBackendEnum.LINEAR", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MambaAttentionBackendEnum.GDN_ATTN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MambaAttentionBackendEnum.CUSTOM", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 1, "n_attrs": 6, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.attention.backends.registry.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.v1.attention.backends.registry", "names": [ "vllm.v1.attention.backends.registry.AttentionBackendEnum", "vllm.v1.attention.backends.registry.MAMBA_TYPE_TO_BACKEND_MAP", "vllm.v1.attention.backends.registry.MambaAttentionBackendEnum", "vllm.v1.attention.backends.registry.logger", "vllm.v1.attention.backends.registry.register_backend" ], "n_typable": 15, "n_typed": 14, "n_any": 0, "n_untyped": 1, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 3, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 2, "n_classes": 2, "n_attrs": 31, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/backends/rocm_aiter_fa.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.attention.backends.rocm_aiter_fa.AiterFlashAttentionDecodeMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "AiterFlashAttentionDecodeMetadata.max_query_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterFlashAttentionDecodeMetadata.min_query_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterFlashAttentionDecodeMetadata.max_seq_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterFlashAttentionDecodeMetadata.query_start_loc", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.rocm_aiter_fa.AiterChunkSlidingWindowMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "AiterChunkSlidingWindowMetadata.swa_seqlens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterChunkSlidingWindowMetadata.swa_cu_seqlens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterChunkSlidingWindowMetadata.swa_seq_starts", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterChunkSlidingWindowMetadata.swa_token_to_batch", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterChunkSlidingWindowMetadata.swa_max_seqlens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterChunkSlidingWindowMetadata.swa_total_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterChunkSlidingWindowMetadata.swa_workspace", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.rocm_aiter_fa.AiterFlashAttentionChunkPrefillMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "AiterFlashAttentionChunkPrefillMetadata.max_query_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterFlashAttentionChunkPrefillMetadata.min_query_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterFlashAttentionChunkPrefillMetadata.max_seq_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterFlashAttentionChunkPrefillMetadata.query_start_loc", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterFlashAttentionChunkPrefillMetadata.chunk_context_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.rocm_aiter_fa.AiterChunkContextMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "AiterChunkContextMetadata.workspace", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterChunkContextMetadata.cu_seq_lens_chunk", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterChunkContextMetadata.chunk_starts", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterChunkContextMetadata.token_to_batch", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterChunkContextMetadata.seq_tot", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterChunkContextMetadata.max_seq_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterChunkContextMetadata.seq_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterChunkContextMetadata.num_chunks", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterChunkContextMetadata.total_token_per_batch", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterChunkContextMetadata.swa_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 10, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.attention.backends.rocm_aiter_fa.block_size", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.v1.attention.backends.rocm_aiter_fa.cp_mha_gather_cache", "n_typed": 13, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 }, { "kind": "class", "name": "vllm.v1.attention.backends.rocm_aiter_fa.AiterFlashAttentionMetadataBuilder", "methods": [ { "kind": "function", "name": "AiterFlashAttentionMetadataBuilder.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "AiterFlashAttentionMetadataBuilder.build_for_cudagraph_capture", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AiterFlashAttentionMetadataBuilder.build", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "AiterFlashAttentionMetadataBuilder.build_for_drafting", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AiterFlashAttentionMetadataBuilder.use_cascade_attention", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AiterFlashAttentionMetadataBuilder._cudagraph_support", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterFlashAttentionMetadataBuilder.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AiterFlashAttentionMetadataBuilder.parallel_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AiterFlashAttentionMetadataBuilder.cache_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AiterFlashAttentionMetadataBuilder.num_heads_q", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AiterFlashAttentionMetadataBuilder.num_heads_kv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AiterFlashAttentionMetadataBuilder.headdim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AiterFlashAttentionMetadataBuilder.block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AiterFlashAttentionMetadataBuilder.aot_sliding_window", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AiterFlashAttentionMetadataBuilder.total_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AiterFlashAttentionMetadataBuilder.extend_workspace", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AiterFlashAttentionMetadataBuilder.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 28, "n_typed": 15, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 12, "n_attrs": 12, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.rocm_aiter_fa.AiterFlashAttentionPrefillMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "AiterFlashAttentionPrefillMetadata.max_query_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterFlashAttentionPrefillMetadata.min_query_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterFlashAttentionPrefillMetadata.max_seq_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterFlashAttentionPrefillMetadata.query_start_loc", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.attention.backends.rocm_aiter_fa.reshape_and_cache_shuffle_kernel", "n_typed": 3, "n_any": 0, "n_untyped": 14, "n_overloads": 1, "n_typable": 17, "n_params": 16, "n_function_overloads": 1, "n_function_params": 16 }, { "kind": "class", "name": "vllm.v1.attention.backends.rocm_aiter_fa.AiterFlashAttentionImpl", "methods": [ { "kind": "function", "name": "AiterFlashAttentionImpl.__init__", "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "AiterFlashAttentionImpl.extend_for_sliding_window", "n_typed": 8, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "AiterFlashAttentionImpl.extend_forward", "n_typed": 15, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 }, { "kind": "function", "name": "AiterFlashAttentionImpl.forward", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "AiterFlashAttentionImpl.do_kv_cache_update", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AiterFlashAttentionImpl.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AiterFlashAttentionImpl.head_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AiterFlashAttentionImpl.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AiterFlashAttentionImpl.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AiterFlashAttentionImpl.alibi_slopes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AiterFlashAttentionImpl.kv_cache_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AiterFlashAttentionImpl.logits_soft_cap", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AiterFlashAttentionImpl.kv_sharing_target_layer_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AiterFlashAttentionImpl.num_queries_per_kv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AiterFlashAttentionImpl.sliding_window", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 64, "n_typed": 49, "n_any": 0, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 49, "n_attrs": 10, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.attention.backends.rocm_aiter_fa.reshape_and_cache_shuffle_triton", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "vllm.v1.attention.backends.rocm_aiter_fa.cp_mha_gather_cache_kernel", "n_typed": 4, "n_any": 0, "n_untyped": 15, "n_overloads": 1, "n_typable": 19, "n_params": 18, "n_function_overloads": 1, "n_function_params": 18 }, { "kind": "class", "name": "vllm.v1.attention.backends.rocm_aiter_fa.AiterFlashAttentionMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "AiterFlashAttentionMetadata.num_actual_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterFlashAttentionMetadata.num_actual_kv_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterFlashAttentionMetadata.max_query_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterFlashAttentionMetadata.query_start_loc", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterFlashAttentionMetadata.max_seq_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterFlashAttentionMetadata.seq_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterFlashAttentionMetadata.slot_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterFlashAttentionMetadata.block_table", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterFlashAttentionMetadata.num_decodes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterFlashAttentionMetadata.num_decode_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterFlashAttentionMetadata.num_prefills", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterFlashAttentionMetadata.num_prefill_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterFlashAttentionMetadata.num_extends", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterFlashAttentionMetadata.num_extend_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterFlashAttentionMetadata.decode_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterFlashAttentionMetadata.prefill_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterFlashAttentionMetadata.extend_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterFlashAttentionMetadata.use_cascade", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterFlashAttentionMetadata.common_prefix_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterFlashAttentionMetadata.total_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterFlashAttentionMetadata.k_scale", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AiterFlashAttentionMetadata.v_scale", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 22, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.attention.backends.rocm_aiter_fa.num_programs", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.v1.attention.backends.rocm_aiter_fa.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.attention.backends.rocm_aiter_fa.AiterFlashAttentionBackend", "methods": [ { "kind": "function", "name": "AiterFlashAttentionBackend.get_supported_kernel_block_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AiterFlashAttentionBackend.get_supported_head_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AiterFlashAttentionBackend.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AiterFlashAttentionBackend.get_impl_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AiterFlashAttentionBackend.get_builder_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AiterFlashAttentionBackend.get_kv_cache_shape", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AiterFlashAttentionBackend.accept_output_buffer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AiterFlashAttentionBackend.supported_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AiterFlashAttentionBackend.forward_includes_kv_cache_update", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 14, "n_typed": 14, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 5, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.attention.backends.rocm_aiter_fa", "names": [ "vllm.v1.attention.backends.rocm_aiter_fa.AiterChunkContextMetadata", "vllm.v1.attention.backends.rocm_aiter_fa.AiterChunkSlidingWindowMetadata", "vllm.v1.attention.backends.rocm_aiter_fa.AiterFlashAttentionBackend", "vllm.v1.attention.backends.rocm_aiter_fa.AiterFlashAttentionChunkPrefillMetadata", "vllm.v1.attention.backends.rocm_aiter_fa.AiterFlashAttentionDecodeMetadata", "vllm.v1.attention.backends.rocm_aiter_fa.AiterFlashAttentionImpl", "vllm.v1.attention.backends.rocm_aiter_fa.AiterFlashAttentionMetadata", "vllm.v1.attention.backends.rocm_aiter_fa.AiterFlashAttentionMetadataBuilder", "vllm.v1.attention.backends.rocm_aiter_fa.AiterFlashAttentionPrefillMetadata", "vllm.v1.attention.backends.rocm_aiter_fa.block_size", "vllm.v1.attention.backends.rocm_aiter_fa.cp_mha_gather_cache", "vllm.v1.attention.backends.rocm_aiter_fa.cp_mha_gather_cache_kernel", "vllm.v1.attention.backends.rocm_aiter_fa.logger", "vllm.v1.attention.backends.rocm_aiter_fa.num_programs", "vllm.v1.attention.backends.rocm_aiter_fa.reshape_and_cache_shuffle_kernel", "vllm.v1.attention.backends.rocm_aiter_fa.reshape_and_cache_shuffle_triton" ], "n_typable": 171, "n_typed": 106, "n_any": 0, "n_untyped": 65, "n_functions": 6, "n_function_overloads": 6, "n_function_params": 58, "n_methods": 16, "n_method_overloads": 16, "n_method_params": 66, "n_classes": 9, "n_attrs": 78, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/backends/rocm_aiter_unified_attn.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.attention.backends.rocm_aiter_unified_attn.RocmAiterUnifiedAttentionBackend", "methods": [ { "kind": "function", "name": "RocmAiterUnifiedAttentionBackend.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RocmAiterUnifiedAttentionBackend.get_impl_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RocmAiterUnifiedAttentionBackend.get_kv_cache_shape", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "RocmAiterUnifiedAttentionBackend.use_cascade_attention", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "RocmAiterUnifiedAttentionBackend.get_builder_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RocmAiterUnifiedAttentionBackend.supports_attn_type", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RocmAiterUnifiedAttentionBackend.accept_output_buffer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "RocmAiterUnifiedAttentionBackend.forward_includes_kv_cache_update", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 16, "n_typed": 14, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 8, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.rocm_aiter_unified_attn.RocmAiterUnifiedAttentionImpl", "methods": [ { "kind": "function", "name": "RocmAiterUnifiedAttentionImpl.fused_output_quant_supported", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RocmAiterUnifiedAttentionImpl.__init__", "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "RocmAiterUnifiedAttentionImpl.forward", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "RocmAiterUnifiedAttentionImpl.do_kv_cache_update", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "RocmAiterUnifiedAttentionImpl.fused_rope_kvcache_supported", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RocmAiterUnifiedAttentionImpl.do_rope_and_kv_cache_update", "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RocmAiterUnifiedAttentionImpl.unified_attention", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 42, "n_typed": 37, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 35, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.attention.backends.rocm_aiter_unified_attn.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.v1.attention.backends.rocm_aiter_unified_attn", "names": [ "vllm.v1.attention.backends.rocm_aiter_unified_attn.RocmAiterUnifiedAttentionBackend", "vllm.v1.attention.backends.rocm_aiter_unified_attn.RocmAiterUnifiedAttentionImpl", "vllm.v1.attention.backends.rocm_aiter_unified_attn.logger" ], "n_typable": 59, "n_typed": 51, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 43, "n_classes": 2, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/backends/rocm_attn.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.attention.backends.rocm_attn.RocmAttentionBackend", "methods": [ { "kind": "function", "name": "RocmAttentionBackend.get_supported_kernel_block_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RocmAttentionBackend.get_supported_head_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RocmAttentionBackend.validate_head_size", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RocmAttentionBackend.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RocmAttentionBackend.get_impl_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RocmAttentionBackend.supports_attn_type", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RocmAttentionBackend.get_kv_cache_shape", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "RocmAttentionBackend.use_cascade_attention", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "RocmAttentionBackend.get_builder_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RocmAttentionBackend.accept_output_buffer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "RocmAttentionBackend.supported_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "RocmAttentionBackend.forward_includes_kv_cache_update", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 21, "n_typed": 19, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 9, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.rocm_attn.RocmAttentionMetadataBuilder", "methods": [ { "kind": "function", "name": "RocmAttentionMetadataBuilder.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "RocmAttentionMetadataBuilder.build_for_cudagraph_capture", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RocmAttentionMetadataBuilder.build", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RocmAttentionMetadataBuilder._cudagraph_support", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "RocmAttentionMetadataBuilder.block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RocmAttentionMetadataBuilder.num_heads_q", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RocmAttentionMetadataBuilder.num_heads_kv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RocmAttentionMetadataBuilder.headdim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 11, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 8, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.rocm_attn.RocmAttentionMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "RocmAttentionMetadata.num_actual_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RocmAttentionMetadata.max_query_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RocmAttentionMetadata.query_start_loc", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RocmAttentionMetadata.max_seq_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RocmAttentionMetadata.seq_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RocmAttentionMetadata.block_table", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RocmAttentionMetadata.slot_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RocmAttentionMetadata.use_cascade", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RocmAttentionMetadata.common_prefix_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RocmAttentionMetadata.cu_prefix_query_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RocmAttentionMetadata.prefix_kv_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RocmAttentionMetadata.suffix_kv_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RocmAttentionMetadata.scheduler_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RocmAttentionMetadata.prefix_scheduler_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 14, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.rocm_attn.RocmAttentionImpl", "methods": [ { "kind": "function", "name": "RocmAttentionImpl.fused_output_quant_supported", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RocmAttentionImpl.__init__", "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "RocmAttentionImpl._forward_encoder_attention", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "RocmAttentionImpl.forward", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "RocmAttentionImpl.do_kv_cache_update", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "RocmAttentionImpl.fused_rope_kvcache_supported", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RocmAttentionImpl.do_rope_and_kv_cache_update", "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RocmAttentionImpl.attn_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RocmAttentionImpl.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RocmAttentionImpl.head_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RocmAttentionImpl.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RocmAttentionImpl.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RocmAttentionImpl.alibi_slopes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RocmAttentionImpl.kv_cache_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RocmAttentionImpl.logits_soft_cap", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RocmAttentionImpl.kv_sharing_target_layer_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RocmAttentionImpl.num_queries_per_kv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RocmAttentionImpl.fp8_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RocmAttentionImpl.sinks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RocmAttentionImpl.sliding_window", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 61, "n_typed": 44, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 41, "n_attrs": 13, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.attention.backends.rocm_attn.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.v1.attention.backends.rocm_attn", "names": [ "vllm.v1.attention.backends.rocm_attn.RocmAttentionBackend", "vllm.v1.attention.backends.rocm_attn.RocmAttentionImpl", "vllm.v1.attention.backends.rocm_attn.RocmAttentionMetadata", "vllm.v1.attention.backends.rocm_attn.RocmAttentionMetadataBuilder", "vllm.v1.attention.backends.rocm_attn.logger" ], "n_typable": 99, "n_typed": 74, "n_any": 0, "n_untyped": 25, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 19, "n_method_overloads": 19, "n_method_params": 58, "n_classes": 4, "n_attrs": 36, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/backends/short_conv_attn.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.attention.backends.short_conv_attn.ShortConvAttentionBackend", "methods": [ { "kind": "function", "name": "ShortConvAttentionBackend.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ShortConvAttentionBackend.get_builder_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.short_conv_attn.ShortConvAttentionMetadataBuilder", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ShortConvAttentionMetadataBuilder.metadata_cls", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.short_conv_attn.ShortConvAttentionMetadata", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.attention.backends.short_conv_attn", "names": [ "vllm.v1.attention.backends.short_conv_attn.ShortConvAttentionBackend", "vllm.v1.attention.backends.short_conv_attn.ShortConvAttentionMetadata", "vllm.v1.attention.backends.short_conv_attn.ShortConvAttentionMetadataBuilder" ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 0, "n_classes": 3, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/backends/tree_attn.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.attention.backends.tree_attn.TreeAttentionMetadataBuilder", "methods": [ { "kind": "function", "name": "TreeAttentionMetadataBuilder.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "TreeAttentionMetadataBuilder.build", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "TreeAttentionMetadataBuilder.build_for_drafting", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TreeAttentionMetadataBuilder.block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TreeAttentionMetadataBuilder.tree_attn_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TreeAttentionMetadataBuilder.reorder_batch_threshold", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 11, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 9, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.tree_attn.TreeAttentionBackend", "methods": [ { "kind": "function", "name": "TreeAttentionBackend.get_supported_kernel_block_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TreeAttentionBackend.get_supported_head_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TreeAttentionBackend.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TreeAttentionBackend.get_impl_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TreeAttentionBackend.get_kv_cache_shape", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "TreeAttentionBackend.get_builder_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TreeAttentionBackend.use_cascade_attention", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TreeAttentionBackend.accept_output_buffer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TreeAttentionBackend.supported_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 16, "n_typed": 14, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 7, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.tree_attn.TreeAttentionMetadata", "methods": [], "properties": [ { "kind": "property", "name": "TreeAttentionMetadata.prefill_metadata", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "TreeAttentionMetadata.decode_metadata", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "TreeAttentionMetadata.num_actual_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TreeAttentionMetadata.max_query_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TreeAttentionMetadata.query_start_loc", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TreeAttentionMetadata.max_seq_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TreeAttentionMetadata.seq_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TreeAttentionMetadata.block_table", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TreeAttentionMetadata.slot_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TreeAttentionMetadata.num_prefill_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TreeAttentionMetadata.num_decode_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TreeAttentionMetadata.num_prefills", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TreeAttentionMetadata.num_decodes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TreeAttentionMetadata.tree_attn_bias", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TreeAttentionMetadata._cached_prefill_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TreeAttentionMetadata._cached_decode_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 14, "n_properties": 2 }, { "kind": "attr", "name": "vllm.v1.attention.backends.tree_attn.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.attention.backends.tree_attn.TreeAttentionImpl", "methods": [ { "kind": "function", "name": "TreeAttentionImpl.__init__", "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "TreeAttentionImpl.forward", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TreeAttentionImpl.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TreeAttentionImpl.head_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TreeAttentionImpl.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TreeAttentionImpl.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TreeAttentionImpl.num_queries_per_kv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TreeAttentionImpl.kv_cache_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TreeAttentionImpl.kv_sharing_target_layer_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TreeAttentionImpl.alibi_slopes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TreeAttentionImpl.logits_soft_cap", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TreeAttentionImpl.sliding_window", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 31, "n_typed": 21, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 19, "n_attrs": 10, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.attention.backends.tree_attn", "names": [ "vllm.v1.attention.backends.tree_attn.TreeAttentionBackend", "vllm.v1.attention.backends.tree_attn.TreeAttentionImpl", "vllm.v1.attention.backends.tree_attn.TreeAttentionMetadata", "vllm.v1.attention.backends.tree_attn.TreeAttentionMetadataBuilder", "vllm.v1.attention.backends.tree_attn.logger" ], "n_typable": 65, "n_typed": 48, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 35, "n_classes": 4, "n_attrs": 30, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/backends/triton_attn.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.v1.attention.backends.triton_attn.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.v1.attention.backends.triton_attn.MIN_LAUNCH_GRID_SIZE_2D", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.triton_attn.TritonAttentionImpl", "methods": [ { "kind": "function", "name": "TritonAttentionImpl.fused_output_quant_supported", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TritonAttentionImpl.__init__", "n_typed": 13, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 }, { "kind": "function", "name": "TritonAttentionImpl.forward", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "TritonAttentionImpl._forward_encoder_attention", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "TritonAttentionImpl.do_kv_cache_update", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "TritonAttentionImpl.fused_rope_kvcache_supported", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TritonAttentionImpl.do_rope_and_kv_cache_update", "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TritonAttentionImpl.num_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TritonAttentionImpl.head_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TritonAttentionImpl.scale", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TritonAttentionImpl.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TritonAttentionImpl.alibi_slopes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TritonAttentionImpl.kv_cache_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TritonAttentionImpl.logits_soft_cap", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TritonAttentionImpl.kv_sharing_target_layer_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TritonAttentionImpl.num_queries_per_kv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TritonAttentionImpl.attn_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TritonAttentionImpl.fp8_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TritonAttentionImpl.sinks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TritonAttentionImpl.use_alibi_sqrt", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TritonAttentionImpl.supports_quant_query_input", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TritonAttentionImpl.sliding_window", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 64, "n_typed": 45, "n_any": 0, "n_untyped": 19, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 42, "n_attrs": 15, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.triton_attn.TritonAttentionMetadataBuilder", "methods": [ { "kind": "function", "name": "TritonAttentionMetadataBuilder.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "TritonAttentionMetadataBuilder.build_for_cudagraph_capture", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TritonAttentionMetadataBuilder.build", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TritonAttentionMetadataBuilder._cudagraph_support", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TritonAttentionMetadataBuilder.block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TritonAttentionMetadataBuilder.num_heads_q", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TritonAttentionMetadataBuilder.num_heads_kv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TritonAttentionMetadataBuilder.headdim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TritonAttentionMetadataBuilder.decode_cudagraph_enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TritonAttentionMetadataBuilder.seq_threshold_3D", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TritonAttentionMetadataBuilder.num_par_softmax_segments", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TritonAttentionMetadataBuilder.softmax_segm_output", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TritonAttentionMetadataBuilder.softmax_segm_max", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TritonAttentionMetadataBuilder.softmax_segm_expsum", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 11, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 8, "n_attrs": 11, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.triton_attn.TritonAttentionMetadata", "methods": [], "properties": [ { "kind": "property", "name": "TritonAttentionMetadata.mm_prefix_range_tensor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "TritonAttentionMetadata.num_actual_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TritonAttentionMetadata.max_query_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TritonAttentionMetadata.query_start_loc", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TritonAttentionMetadata.max_seq_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TritonAttentionMetadata.seq_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TritonAttentionMetadata.block_table", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TritonAttentionMetadata.slot_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TritonAttentionMetadata.seq_threshold_3D", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TritonAttentionMetadata.num_par_softmax_segments", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TritonAttentionMetadata.softmax_segm_output", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TritonAttentionMetadata.softmax_segm_max", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TritonAttentionMetadata.softmax_segm_expsum", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TritonAttentionMetadata.use_cascade", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TritonAttentionMetadata.common_prefix_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TritonAttentionMetadata.cu_prefix_query_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TritonAttentionMetadata.prefix_kv_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TritonAttentionMetadata.suffix_kv_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TritonAttentionMetadata.scheduler_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TritonAttentionMetadata.prefix_scheduler_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TritonAttentionMetadata.mm_prefix_range", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 20, "n_properties": 1 }, { "kind": "attr", "name": "vllm.v1.attention.backends.triton_attn.NUM_PAR_SOFTMAX_SEGMENTS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.v1.attention.backends.triton_attn.TritonAttentionBackend", "methods": [ { "kind": "function", "name": "TritonAttentionBackend.get_supported_kernel_block_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TritonAttentionBackend.get_name", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TritonAttentionBackend.get_impl_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TritonAttentionBackend.get_kv_cache_shape", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "TritonAttentionBackend.get_kv_cache_stride_order", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TritonAttentionBackend.use_cascade_attention", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "TritonAttentionBackend.get_builder_cls", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TritonAttentionBackend.supports_head_size", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TritonAttentionBackend.supports_mm_prefix", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TritonAttentionBackend.supports_sink", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TritonAttentionBackend.supports_attn_type", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TritonAttentionBackend.supports_alibi_sqrt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "TritonAttentionBackend.supports_compute_capability", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TritonAttentionBackend.accept_output_buffer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TritonAttentionBackend.supported_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TritonAttentionBackend.supported_kv_cache_dtypes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "TritonAttentionBackend.forward_includes_kv_cache_update", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 28, "n_typed": 26, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 11, "n_attrs": 4, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.attention.backends.triton_attn", "names": [ "vllm.v1.attention.backends.triton_attn.MIN_LAUNCH_GRID_SIZE_2D", "vllm.v1.attention.backends.triton_attn.NUM_PAR_SOFTMAX_SEGMENTS", "vllm.v1.attention.backends.triton_attn.TritonAttentionBackend", "vllm.v1.attention.backends.triton_attn.TritonAttentionImpl", "vllm.v1.attention.backends.triton_attn.TritonAttentionMetadata", "vllm.v1.attention.backends.triton_attn.TritonAttentionMetadataBuilder", "vllm.v1.attention.backends.triton_attn.logger" ], "n_typable": 116, "n_typed": 83, "n_any": 0, "n_untyped": 33, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 23, "n_method_overloads": 23, "n_method_params": 61, "n_classes": 4, "n_attrs": 53, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/backends/utils.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.attention.backends.utils.KVSharingFastPrefillMetadata", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.attention.backends.utils.reshape_query_for_spec_decode", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.v1.attention.backends.utils.make_kv_sharing_fast_prefill_common_attn_metadata", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.v1.attention.backends.utils.KVCacheLayoutType", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.v1.attention.backends.utils.get_dcp_local_seq_lens", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.v1.attention.backends.utils.split_decodes_and_prefills", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.v1.attention.backends.utils.PAD_SLOT_ID", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.v1.attention.backends.utils.reorder_batch_to_split_decodes_and_prefills", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.v1.attention.backends.utils.compute_causal_conv1d_metadata", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.v1.attention.backends.utils.get_per_layer_parameters", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.v1.attention.backends.utils.subclass_attention_metadata", "n_typed": 2, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.v1.attention.backends.utils.make_local_attention_virtual_batches", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.v1.attention.backends.utils.create_fast_prefill_custom_backend", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.v1.attention.backends.utils.reshape_attn_output_for_spec_decode", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.v1.attention.backends.utils.PerLayerParameters", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "PerLayerParameters.window_left", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PerLayerParameters.logits_soft_cap", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PerLayerParameters.sm_scale", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PerLayerParameters.has_sinks", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PerLayerParameters.has_same_window_lefts", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PerLayerParameters.has_same_all_params", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 6, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.attention.backends.utils.set_kv_cache_layout", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.v1.attention.backends.utils.split_decodes_prefills_and_extends", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.v1.attention.backends.utils.is_valid_kv_cache_layout", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.v1.attention.backends.utils.get_kv_cache_layout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.v1.attention.backends.utils.infer_global_hyperparameters", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.v1.attention.backends.utils.mamba_get_block_table_tensor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.v1.attention.backends.utils.split_prefill_chunks", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.v1.attention.backends.utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.v1.attention.backends.utils", "names": [ "vllm.v1.attention.backends.utils.KVCacheLayoutType", "vllm.v1.attention.backends.utils.KVSharingFastPrefillMetadata", "vllm.v1.attention.backends.utils.PAD_SLOT_ID", "vllm.v1.attention.backends.utils.PerLayerParameters", "vllm.v1.attention.backends.utils.compute_causal_conv1d_metadata", "vllm.v1.attention.backends.utils.create_fast_prefill_custom_backend", "vllm.v1.attention.backends.utils.get_dcp_local_seq_lens", "vllm.v1.attention.backends.utils.get_kv_cache_layout", "vllm.v1.attention.backends.utils.get_per_layer_parameters", "vllm.v1.attention.backends.utils.infer_global_hyperparameters", "vllm.v1.attention.backends.utils.is_valid_kv_cache_layout", "vllm.v1.attention.backends.utils.logger", "vllm.v1.attention.backends.utils.make_kv_sharing_fast_prefill_common_attn_metadata", "vllm.v1.attention.backends.utils.make_local_attention_virtual_batches", "vllm.v1.attention.backends.utils.mamba_get_block_table_tensor", "vllm.v1.attention.backends.utils.reorder_batch_to_split_decodes_and_prefills", "vllm.v1.attention.backends.utils.reshape_attn_output_for_spec_decode", "vllm.v1.attention.backends.utils.reshape_query_for_spec_decode", "vllm.v1.attention.backends.utils.set_kv_cache_layout", "vllm.v1.attention.backends.utils.split_decodes_and_prefills", "vllm.v1.attention.backends.utils.split_decodes_prefills_and_extends", "vllm.v1.attention.backends.utils.split_prefill_chunks", "vllm.v1.attention.backends.utils.subclass_attention_metadata" ], "n_typable": 59, "n_typed": 53, "n_any": 2, "n_untyped": 4, "n_functions": 18, "n_function_overloads": 18, "n_function_params": 39, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 2, "n_attrs": 9, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/ops/chunked_prefill_paged_decode.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.attention.ops.chunked_prefill_paged_decode.chunked_prefill_paged_decode", "n_typed": 1, "n_any": 0, "n_untyped": 20, "n_overloads": 1, "n_typable": 21, "n_params": 20, "n_function_overloads": 1, "n_function_params": 20 }, { "kind": "function", "name": "vllm.v1.attention.ops.chunked_prefill_paged_decode.cdiv_fn", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.v1.attention.ops.chunked_prefill_paged_decode.float8_info", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.v1.attention.ops.chunked_prefill_paged_decode.kernel_paged_attention_2d", "n_typed": 29, "n_any": 0, "n_untyped": 14, "n_overloads": 1, "n_typable": 43, "n_params": 42, "n_function_overloads": 1, "n_function_params": 42 } ], "type_ignores": [], "name": "vllm.v1.attention.ops.chunked_prefill_paged_decode", "names": [ "vllm.v1.attention.ops.chunked_prefill_paged_decode.cdiv_fn", "vllm.v1.attention.ops.chunked_prefill_paged_decode.chunked_prefill_paged_decode", "vllm.v1.attention.ops.chunked_prefill_paged_decode.float8_info", "vllm.v1.attention.ops.chunked_prefill_paged_decode.kernel_paged_attention_2d" ], "n_typable": 68, "n_typed": 30, "n_any": 0, "n_untyped": 38, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 64, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/ops/common.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.attention.ops.common.pack_seq_triton", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "class", "name": "vllm.v1.attention.ops.common.CPTritonContext", "methods": [ { "kind": "function", "name": "CPTritonContext.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CPTritonContext.call_kernel", "n_typed": 0, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CPTritonContext.inner_kernel", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 0, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.attention.ops.common.correct_attn_out", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.v1.attention.ops.common.unpack_seq_triton", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.v1.attention.ops.common.cp_lse_ag_out_ar", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.v1.attention.ops.common.cp_lse_ag_out_rs", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "type_ignores": [], "name": "vllm.v1.attention.ops.common", "names": [ "vllm.v1.attention.ops.common.CPTritonContext", "vllm.v1.attention.ops.common.correct_attn_out", "vllm.v1.attention.ops.common.cp_lse_ag_out_ar", "vllm.v1.attention.ops.common.cp_lse_ag_out_rs", "vllm.v1.attention.ops.common.pack_seq_triton", "vllm.v1.attention.ops.common.unpack_seq_triton" ], "n_typable": 38, "n_typed": 27, "n_any": 0, "n_untyped": 11, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 26, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/ops/flashmla.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.v1.attention.ops.flashmla.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.attention.ops.flashmla.FlashMLASchedMeta", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.attention.ops.flashmla.is_flashmla_sparse_supported", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.v1.attention.ops.flashmla.get_mla_metadata_dense_fp8", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.v1.attention.ops.flashmla.flash_mla_with_kvcache_fp8", "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "vllm.v1.attention.ops.flashmla.is_flashmla_dense_supported", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "type_ignores": [ { "kind": "type", "rules": [ "no-redef" ] }, { "kind": "type", "rules": [ "assignment" ] }, { "kind": "type", "rules": [ "assignment" ] }, { "kind": "type", "rules": [ "assignment" ] }, { "kind": "type", "rules": [ "assignment" ] }, { "kind": "type", "rules": [ "assignment" ] }, { "kind": "type", "rules": [ "assignment" ] } ], "name": "vllm.v1.attention.ops.flashmla", "names": [ "vllm.v1.attention.ops.flashmla.FlashMLASchedMeta", "vllm.v1.attention.ops.flashmla.flash_mla_with_kvcache_fp8", "vllm.v1.attention.ops.flashmla.get_mla_metadata_dense_fp8", "vllm.v1.attention.ops.flashmla.is_flashmla_dense_supported", "vllm.v1.attention.ops.flashmla.is_flashmla_sparse_supported", "vllm.v1.attention.ops.flashmla.logger" ], "n_typable": 19, "n_typed": 18, "n_any": 0, "n_untyped": 1, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 14, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 7 }, { "path": "vllm/v1/attention/ops/merge_attn_states.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.attention.ops.merge_attn_states.merge_attn_states", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "type_ignores": [], "name": "vllm.v1.attention.ops.merge_attn_states", "names": [ "vllm.v1.attention.ops.merge_attn_states.merge_attn_states" ], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 6, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/ops/paged_attn.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.attention.ops.paged_attn.PagedAttention", "methods": [ { "kind": "function", "name": "PagedAttention.split_kv_cache", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "PagedAttention.write_to_paged_cache", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 } ], "properties": [], "attrs": [], "n_typable": 13, "n_typed": 13, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 11, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [ { "kind": "type", "rules": [ "no-redef" ] } ], "name": "vllm.v1.attention.ops.paged_attn", "names": [ "vllm.v1.attention.ops.paged_attn.PagedAttention" ], "n_typable": 13, "n_typed": 13, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 11, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 1 }, { "path": "vllm/v1/attention/ops/prefix_prefill.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.v1.attention.ops.prefix_prefill.NUM_WARPS", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.v1.attention.ops.prefix_prefill.float8_info", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.v1.attention.ops.prefix_prefill.BASE_BLOCK", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.v1.attention.ops.prefix_prefill.context_attention_fwd", "n_typed": 4, "n_any": 0, "n_untyped": 18, "n_overloads": 1, "n_typable": 22, "n_params": 21, "n_function_overloads": 1, "n_function_params": 21 }, { "kind": "attr", "name": "vllm.v1.attention.ops.prefix_prefill.IS_TURING", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.v1.attention.ops.prefix_prefill", "names": [ "vllm.v1.attention.ops.prefix_prefill.BASE_BLOCK", "vllm.v1.attention.ops.prefix_prefill.IS_TURING", "vllm.v1.attention.ops.prefix_prefill.NUM_WARPS", "vllm.v1.attention.ops.prefix_prefill.context_attention_fwd", "vllm.v1.attention.ops.prefix_prefill.float8_info" ], "n_typable": 26, "n_typed": 4, "n_any": 0, "n_untyped": 22, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 21, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/ops/rocm_aiter_mla_sparse.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.attention.ops.rocm_aiter_mla_sparse.rocm_fp8_paged_mqa_logits", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "vllm.v1.attention.ops.rocm_aiter_mla_sparse.cp_gather_indexer_k_quant_cache_triton", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "vllm.v1.attention.ops.rocm_aiter_mla_sparse.rocm_aiter_sparse_attn_indexer", "n_typed": 14, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 }, { "kind": "function", "name": "vllm.v1.attention.ops.rocm_aiter_mla_sparse.fp8_paged_mqa_logits_torch", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.v1.attention.ops.rocm_aiter_mla_sparse.indexer_k_quant_and_cache_triton", "n_typed": 3, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "vllm.v1.attention.ops.rocm_aiter_mla_sparse.rocm_fp8_mqa_logits", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.v1.attention.ops.rocm_aiter_mla_sparse.fp8_mqa_logits_torch", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.v1.attention.ops.rocm_aiter_mla_sparse.rocm_aiter_sparse_attn_indexer_fake", "n_typed": 14, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 } ], "type_ignores": [], "name": "vllm.v1.attention.ops.rocm_aiter_mla_sparse", "names": [ "vllm.v1.attention.ops.rocm_aiter_mla_sparse.cp_gather_indexer_k_quant_cache_triton", "vllm.v1.attention.ops.rocm_aiter_mla_sparse.fp8_mqa_logits_torch", "vllm.v1.attention.ops.rocm_aiter_mla_sparse.fp8_paged_mqa_logits_torch", "vllm.v1.attention.ops.rocm_aiter_mla_sparse.indexer_k_quant_and_cache_triton", "vllm.v1.attention.ops.rocm_aiter_mla_sparse.rocm_aiter_sparse_attn_indexer", "vllm.v1.attention.ops.rocm_aiter_mla_sparse.rocm_aiter_sparse_attn_indexer_fake", "vllm.v1.attention.ops.rocm_aiter_mla_sparse.rocm_fp8_mqa_logits", "vllm.v1.attention.ops.rocm_aiter_mla_sparse.rocm_fp8_paged_mqa_logits" ], "n_typable": 72, "n_typed": 65, "n_any": 0, "n_untyped": 7, "n_functions": 8, "n_function_overloads": 8, "n_function_params": 64, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/ops/triton_decode_attention.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.attention.ops.triton_decode_attention.decode_attention_fwd", "n_typed": 0, "n_any": 0, "n_untyped": 13, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 }, { "kind": "attr", "name": "vllm.v1.attention.ops.triton_decode_attention.is_hip_", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.v1.attention.ops.triton_decode_attention.decode_attention_fwd_grouped", "n_typed": 0, "n_any": 0, "n_untyped": 13, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 }, { "kind": "attr", "name": "vllm.v1.attention.ops.triton_decode_attention.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.v1.attention.ops.triton_decode_attention.decode_attention_fwd_normal", "n_typed": 0, "n_any": 0, "n_untyped": 13, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 }, { "kind": "function", "name": "vllm.v1.attention.ops.triton_decode_attention.tanh", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.v1.attention.ops.triton_decode_attention", "names": [ "vllm.v1.attention.ops.triton_decode_attention.decode_attention_fwd", "vllm.v1.attention.ops.triton_decode_attention.decode_attention_fwd_grouped", "vllm.v1.attention.ops.triton_decode_attention.decode_attention_fwd_normal", "vllm.v1.attention.ops.triton_decode_attention.is_hip_", "vllm.v1.attention.ops.triton_decode_attention.logger", "vllm.v1.attention.ops.triton_decode_attention.tanh" ], "n_typable": 43, "n_typed": 0, "n_any": 0, "n_untyped": 43, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 37, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/ops/triton_merge_attn_states.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.attention.ops.triton_merge_attn_states.merge_attn_states_kernel", "n_typed": 3, "n_any": 0, "n_untyped": 9, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "vllm.v1.attention.ops.triton_merge_attn_states.merge_attn_states", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "type_ignores": [], "name": "vllm.v1.attention.ops.triton_merge_attn_states", "names": [ "vllm.v1.attention.ops.triton_merge_attn_states.merge_attn_states", "vllm.v1.attention.ops.triton_merge_attn_states.merge_attn_states_kernel" ], "n_typable": 19, "n_typed": 10, "n_any": 0, "n_untyped": 9, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 17, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/ops/triton_prefill_attention.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.attention.ops.triton_prefill_attention.context_attention_fwd", "n_typed": 11, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "vllm.v1.attention.ops.triton_prefill_attention.get_block_size", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.v1.attention.ops.triton_prefill_attention", "names": [ "vllm.v1.attention.ops.triton_prefill_attention.context_attention_fwd", "vllm.v1.attention.ops.triton_prefill_attention.get_block_size" ], "n_typable": 14, "n_typed": 13, "n_any": 0, "n_untyped": 1, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 12, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/ops/triton_reshape_and_cache_flash.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.attention.ops.triton_reshape_and_cache_flash.reshape_and_cache_kernel_flash", "n_typed": 14, "n_any": 0, "n_untyped": 8, "n_overloads": 1, "n_typable": 22, "n_params": 21, "n_function_overloads": 1, "n_function_params": 21 }, { "kind": "function", "name": "vllm.v1.attention.ops.triton_reshape_and_cache_flash.triton_reshape_and_cache_flash", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "vllm.v1.attention.ops.triton_reshape_and_cache_flash.reshape_and_cache_kernel_flash_diffkv", "n_typed": 10, "n_any": 0, "n_untyped": 7, "n_overloads": 1, "n_typable": 17, "n_params": 16, "n_function_overloads": 1, "n_function_params": 16 }, { "kind": "function", "name": "vllm.v1.attention.ops.triton_reshape_and_cache_flash.triton_reshape_and_cache_flash_diffkv", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "type_ignores": [], "name": "vllm.v1.attention.ops.triton_reshape_and_cache_flash", "names": [ "vllm.v1.attention.ops.triton_reshape_and_cache_flash.reshape_and_cache_kernel_flash", "vllm.v1.attention.ops.triton_reshape_and_cache_flash.reshape_and_cache_kernel_flash_diffkv", "vllm.v1.attention.ops.triton_reshape_and_cache_flash.triton_reshape_and_cache_flash", "vllm.v1.attention.ops.triton_reshape_and_cache_flash.triton_reshape_and_cache_flash_diffkv" ], "n_typable": 56, "n_typed": 39, "n_any": 0, "n_untyped": 17, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 52, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/ops/triton_unified_attention.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.v1.attention.ops.triton_unified_attention.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.v1.attention.ops.triton_unified_attention.kernel_unified_attention_3d", "n_typed": 30, "n_any": 0, "n_untyped": 18, "n_overloads": 1, "n_typable": 48, "n_params": 47, "n_function_overloads": 1, "n_function_params": 47 }, { "kind": "attr", "name": "vllm.v1.attention.ops.triton_unified_attention.is_batch_invariant", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.v1.attention.ops.triton_unified_attention.cdiv_fn", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.v1.attention.ops.triton_unified_attention.float8_info", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.v1.attention.ops.triton_unified_attention.apply_softcap", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.v1.attention.ops.triton_unified_attention.find_seq_idx", "n_typed": 2, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.v1.attention.ops.triton_unified_attention.unified_attention", "n_typed": 0, "n_any": 0, "n_untyped": 28, "n_overloads": 1, "n_typable": 28, "n_params": 27, "n_function_overloads": 1, "n_function_params": 27 }, { "kind": "function", "name": "vllm.v1.attention.ops.triton_unified_attention.kernel_unified_attention_2d", "n_typed": 34, "n_any": 0, "n_untyped": 17, "n_overloads": 1, "n_typable": 51, "n_params": 50, "n_function_overloads": 1, "n_function_params": 50 }, { "kind": "function", "name": "vllm.v1.attention.ops.triton_unified_attention.reduce_segments", "n_typed": 12, "n_any": 0, "n_untyped": 9, "n_overloads": 1, "n_typable": 21, "n_params": 20, "n_function_overloads": 1, "n_function_params": 20 } ], "type_ignores": [], "name": "vllm.v1.attention.ops.triton_unified_attention", "names": [ "vllm.v1.attention.ops.triton_unified_attention.apply_softcap", "vllm.v1.attention.ops.triton_unified_attention.cdiv_fn", "vllm.v1.attention.ops.triton_unified_attention.find_seq_idx", "vllm.v1.attention.ops.triton_unified_attention.float8_info", "vllm.v1.attention.ops.triton_unified_attention.is_batch_invariant", "vllm.v1.attention.ops.triton_unified_attention.kernel_unified_attention_2d", "vllm.v1.attention.ops.triton_unified_attention.kernel_unified_attention_3d", "vllm.v1.attention.ops.triton_unified_attention.logger", "vllm.v1.attention.ops.triton_unified_attention.reduce_segments", "vllm.v1.attention.ops.triton_unified_attention.unified_attention" ], "n_typable": 163, "n_typed": 78, "n_any": 0, "n_untyped": 85, "n_functions": 7, "n_function_overloads": 7, "n_function_params": 153, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/ops/vit_attn_wrappers.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.attention.ops.vit_attn_wrappers.vit_triton_attn_wrapper", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "vllm.v1.attention.ops.vit_attn_wrappers.flash_attn_maxseqlen_wrapper", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "vllm.v1.attention.ops.vit_attn_wrappers.vit_torch_sdpa_wrapper", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.v1.attention.ops.vit_attn_wrappers.torch_sdpa_wrapper_fake", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.v1.attention.ops.vit_attn_wrappers.flash_attn_maxseqlen_wrapper_fake", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "vllm.v1.attention.ops.vit_attn_wrappers.triton_attn_wrapper_fake", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "vllm.v1.attention.ops.vit_attn_wrappers.vit_flash_attn_wrapper", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "vllm.v1.attention.ops.vit_attn_wrappers.vit_flashinfer_wrapper_fake", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "vllm.v1.attention.ops.vit_attn_wrappers.apply_sdpa", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.v1.attention.ops.vit_attn_wrappers.torch_sdpa_wrapper", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.v1.attention.ops.vit_attn_wrappers.triton_attn_wrapper", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "vllm.v1.attention.ops.vit_attn_wrappers.vit_flashinfer_wrapper", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "vllm.v1.attention.ops.vit_attn_wrappers.flashinfer_wrapper", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 } ], "type_ignores": [], "name": "vllm.v1.attention.ops.vit_attn_wrappers", "names": [ "vllm.v1.attention.ops.vit_attn_wrappers.apply_sdpa", "vllm.v1.attention.ops.vit_attn_wrappers.flash_attn_maxseqlen_wrapper", "vllm.v1.attention.ops.vit_attn_wrappers.flash_attn_maxseqlen_wrapper_fake", "vllm.v1.attention.ops.vit_attn_wrappers.flashinfer_wrapper", "vllm.v1.attention.ops.vit_attn_wrappers.torch_sdpa_wrapper", "vllm.v1.attention.ops.vit_attn_wrappers.torch_sdpa_wrapper_fake", "vllm.v1.attention.ops.vit_attn_wrappers.triton_attn_wrapper", "vllm.v1.attention.ops.vit_attn_wrappers.triton_attn_wrapper_fake", "vllm.v1.attention.ops.vit_attn_wrappers.vit_flash_attn_wrapper", "vllm.v1.attention.ops.vit_attn_wrappers.vit_flashinfer_wrapper", "vllm.v1.attention.ops.vit_attn_wrappers.vit_flashinfer_wrapper_fake", "vllm.v1.attention.ops.vit_attn_wrappers.vit_torch_sdpa_wrapper", "vllm.v1.attention.ops.vit_attn_wrappers.vit_triton_attn_wrapper" ], "n_typable": 108, "n_typed": 108, "n_any": 0, "n_untyped": 0, "n_functions": 13, "n_function_overloads": 13, "n_function_params": 95, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/attention/selector.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.attention.selector.get_attn_backend", "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "vllm.v1.attention.selector.get_mamba_attn_backend", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.v1.attention.selector.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.attention.selector.AttentionSelectorConfig", "methods": [ { "kind": "function", "name": "AttentionSelectorConfig.__repr__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AttentionSelectorConfig.head_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionSelectorConfig.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionSelectorConfig.kv_cache_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionSelectorConfig.block_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionSelectorConfig.use_mla", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionSelectorConfig.has_sink", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionSelectorConfig.use_sparse", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionSelectorConfig.use_mm_prefix", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionSelectorConfig.use_per_head_quant_scales", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionSelectorConfig.attn_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 10, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.attention.selector", "names": [ "vllm.v1.attention.selector.AttentionSelectorConfig", "vllm.v1.attention.selector.get_attn_backend", "vllm.v1.attention.selector.get_mamba_attn_backend", "vllm.v1.attention.selector.logger" ], "n_typable": 16, "n_typed": 14, "n_any": 0, "n_untyped": 2, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 12, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_classes": 1, "n_attrs": 11, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/core/block_pool.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.core.block_pool.BlockPool", "methods": [ { "kind": "function", "name": "BlockPool.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "BlockPool.get_cached_block", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BlockPool.cache_full_blocks", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "BlockPool.get_new_blocks", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BlockPool._maybe_evict_cached_block", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BlockPool.touch", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BlockPool.free_blocks", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BlockPool.evict_blocks", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BlockPool.reset_prefix_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BlockPool.get_num_free_blocks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BlockPool.get_usage", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BlockPool.take_events", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BlockPool.num_gpu_blocks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockPool.enable_caching", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockPool.hash_block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockPool.blocks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BlockPool.free_block_queue", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockPool.cached_block_hash_to_block", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BlockPool.null_block", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockPool.enable_kv_cache_events", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockPool.kv_event_queue", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BlockPool.metrics_collector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 40, "n_typed": 32, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 18, "n_attrs": 10, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.core.block_pool.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.core.block_pool.BlockHashToBlockMap", "methods": [ { "kind": "function", "name": "BlockHashToBlockMap.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BlockHashToBlockMap.get_one_block", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BlockHashToBlockMap.insert", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BlockHashToBlockMap.pop", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BlockHashToBlockMap.__len__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BlockHashToBlockMap._unexpected_blocks_type", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 10, "n_any": 1, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 6, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.core.block_pool", "names": [ "vllm.v1.core.block_pool.BlockHashToBlockMap", "vllm.v1.core.block_pool.BlockPool", "vllm.v1.core.block_pool.logger" ], "n_typable": 53, "n_typed": 42, "n_any": 1, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 18, "n_method_overloads": 18, "n_method_params": 24, "n_classes": 2, "n_attrs": 11, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/core/encoder_cache_manager.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.core.encoder_cache_manager.compute_mm_encoder_budget", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.v1.core.encoder_cache_manager.EncoderDecoderCacheManager", "methods": [ { "kind": "function", "name": "EncoderDecoderCacheManager.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EncoderDecoderCacheManager.reset", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EncoderDecoderCacheManager.check_and_update_cache", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EncoderDecoderCacheManager.can_allocate", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "EncoderDecoderCacheManager.allocate", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EncoderDecoderCacheManager.free", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EncoderDecoderCacheManager.get_cached_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EncoderDecoderCacheManager.get_freed_mm_hashes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EncoderDecoderCacheManager.free_encoder_input", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EncoderDecoderCacheManager.cache_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EncoderDecoderCacheManager.num_free_slots", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EncoderDecoderCacheManager.allocated", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EncoderDecoderCacheManager.to_free", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 26, "n_typed": 23, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 13, "n_attrs": 4, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.core.encoder_cache_manager.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.core.encoder_cache_manager.EncoderCacheManager", "methods": [ { "kind": "function", "name": "EncoderCacheManager.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EncoderCacheManager.reset", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EncoderCacheManager.check_and_update_cache", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EncoderCacheManager.can_allocate", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "EncoderCacheManager.allocate", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EncoderCacheManager.get_cached_input_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EncoderCacheManager.free_encoder_input", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EncoderCacheManager.free", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EncoderCacheManager.get_freed_mm_hashes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EncoderCacheManager.cache_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EncoderCacheManager.num_free_slots", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EncoderCacheManager.num_freeable_slots", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EncoderCacheManager.cached", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EncoderCacheManager.freeable", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EncoderCacheManager.freed", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 28, "n_typed": 24, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 13, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.core.encoder_cache_manager", "names": [ "vllm.v1.core.encoder_cache_manager.EncoderCacheManager", "vllm.v1.core.encoder_cache_manager.EncoderDecoderCacheManager", "vllm.v1.core.encoder_cache_manager.compute_mm_encoder_budget", "vllm.v1.core.encoder_cache_manager.logger" ], "n_typable": 58, "n_typed": 50, "n_any": 0, "n_untyped": 8, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 18, "n_method_overloads": 18, "n_method_params": 26, "n_classes": 2, "n_attrs": 11, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/core/kv_cache_coordinator.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.core.kv_cache_coordinator.get_kv_cache_coordinator", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "class", "name": "vllm.v1.core.kv_cache_coordinator.UnitaryKVCacheCoordinator", "methods": [ { "kind": "function", "name": "UnitaryKVCacheCoordinator.__init__", "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "UnitaryKVCacheCoordinator.find_longest_cache_hit", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "UnitaryKVCacheCoordinator.kv_cache_spec", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UnitaryKVCacheCoordinator.block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UnitaryKVCacheCoordinator.dcp_world_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UnitaryKVCacheCoordinator.pcp_world_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 12, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 11, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.core.kv_cache_coordinator.KVCacheCoordinator", "methods": [ { "kind": "function", "name": "KVCacheCoordinator.__init__", "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "KVCacheCoordinator.get_num_blocks_to_allocate", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "KVCacheCoordinator.allocate_new_computed_blocks", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "KVCacheCoordinator.allocate_new_blocks", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "KVCacheCoordinator.cache_blocks", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "KVCacheCoordinator.free", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVCacheCoordinator.get_num_common_prefix_blocks", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVCacheCoordinator.remove_skipped_blocks", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "KVCacheCoordinator.get_blocks", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVCacheCoordinator.find_longest_cache_hit", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "KVCacheCoordinator.new_step_starts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "KVCacheCoordinator.kv_cache_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KVCacheCoordinator.max_model_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KVCacheCoordinator.enable_caching", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KVCacheCoordinator.block_pool", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KVCacheCoordinator.use_eagle", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KVCacheCoordinator.single_type_managers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 49, "n_typed": 42, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 32, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.core.kv_cache_coordinator.KVCacheCoordinatorNoPrefixCache", "methods": [ { "kind": "function", "name": "KVCacheCoordinatorNoPrefixCache.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "KVCacheCoordinatorNoPrefixCache.get_num_common_prefix_blocks", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVCacheCoordinatorNoPrefixCache.find_longest_cache_hit", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "KVCacheCoordinatorNoPrefixCache.num_single_type_manager", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 13, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 11, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.core.kv_cache_coordinator.HybridKVCacheCoordinator", "methods": [ { "kind": "function", "name": "HybridKVCacheCoordinator.__init__", "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "HybridKVCacheCoordinator.verify_and_split_kv_cache_groups", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "HybridKVCacheCoordinator.find_longest_cache_hit", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "HybridKVCacheCoordinator.hash_block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 13, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 11, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.core.kv_cache_coordinator", "names": [ "vllm.v1.core.kv_cache_coordinator.HybridKVCacheCoordinator", "vllm.v1.core.kv_cache_coordinator.KVCacheCoordinator", "vllm.v1.core.kv_cache_coordinator.KVCacheCoordinatorNoPrefixCache", "vllm.v1.core.kv_cache_coordinator.UnitaryKVCacheCoordinator", "vllm.v1.core.kv_cache_coordinator.get_kv_cache_coordinator" ], "n_typable": 106, "n_typed": 90, "n_any": 0, "n_untyped": 16, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 9, "n_methods": 19, "n_method_overloads": 19, "n_method_params": 65, "n_classes": 4, "n_attrs": 12, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/core/kv_cache_manager.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.v1.core.kv_cache_manager.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.core.kv_cache_manager.KVCacheManager", "methods": [ { "kind": "function", "name": "KVCacheManager.__init__", "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "KVCacheManager.make_prefix_cache_stats", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KVCacheManager.get_computed_blocks", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVCacheManager.allocate_slots", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "KVCacheManager.free", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVCacheManager.remove_skipped_blocks", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "KVCacheManager.evict_blocks", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVCacheManager.reset_prefix_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KVCacheManager.get_num_common_prefix_blocks", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVCacheManager.take_events", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KVCacheManager.get_blocks", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVCacheManager.get_block_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVCacheManager.cache_blocks", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "KVCacheManager.create_kv_cache_blocks", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVCacheManager.take_new_block_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KVCacheManager.new_step_starts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "KVCacheManager.usage", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "KVCacheManager.max_model_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KVCacheManager.enable_caching", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KVCacheManager.use_eagle", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KVCacheManager.log_stats", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KVCacheManager.metrics_collector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KVCacheManager.prefix_cache_stats", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KVCacheManager.coordinator", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KVCacheManager.num_kv_cache_groups", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KVCacheManager.block_pool", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KVCacheManager.kv_cache_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KVCacheManager.empty_kv_cache_blocks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 57, "n_typed": 46, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 16, "n_method_overloads": 16, "n_method_params": 29, "n_attrs": 11, "n_properties": 1 }, { "kind": "class", "name": "vllm.v1.core.kv_cache_manager.KVCacheBlocks", "methods": [ { "kind": "function", "name": "KVCacheBlocks.__add__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVCacheBlocks.get_block_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 2, "n_params": 1, "n_function_overloads": 2, "n_function_params": 1 }, { "kind": "function", "name": "KVCacheBlocks.get_unhashed_block_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KVCacheBlocks.new_empty", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "KVCacheBlocks.blocks", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 5, "n_method_params": 2, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.core.kv_cache_manager", "names": [ "vllm.v1.core.kv_cache_manager.KVCacheBlocks", "vllm.v1.core.kv_cache_manager.KVCacheManager", "vllm.v1.core.kv_cache_manager.logger" ], "n_typable": 64, "n_typed": 52, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 20, "n_method_overloads": 21, "n_method_params": 31, "n_classes": 2, "n_attrs": 13, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/v1/core/kv_cache_metrics.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.core.kv_cache_metrics.KVCacheMetricsCollector", "methods": [ { "kind": "function", "name": "KVCacheMetricsCollector.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVCacheMetricsCollector.should_sample_block", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KVCacheMetricsCollector.on_block_allocated", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVCacheMetricsCollector.on_block_accessed", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVCacheMetricsCollector.on_block_evicted", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVCacheMetricsCollector.reset", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KVCacheMetricsCollector.drain_events", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "KVCacheMetricsCollector.sample_rate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KVCacheMetricsCollector.block_metrics", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 13, "n_typed": 11, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 4, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.core.kv_cache_metrics.BlockMetricsState", "methods": [ { "kind": "function", "name": "BlockMetricsState.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BlockMetricsState.record_access", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BlockMetricsState.get_lifetime_seconds", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BlockMetricsState.get_idle_time_seconds", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BlockMetricsState.get_reuse_gaps_seconds", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BlockMetricsState.birth_time_ns", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockMetricsState.last_access_ns", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockMetricsState.access_history", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 8, "n_typed": 5, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.core.kv_cache_metrics", "names": [ "vllm.v1.core.kv_cache_metrics.BlockMetricsState", "vllm.v1.core.kv_cache_metrics.KVCacheMetricsCollector" ], "n_typable": 21, "n_typed": 16, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 4, "n_classes": 2, "n_attrs": 5, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/core/kv_cache_utils.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.v1.core.kv_cache_utils.BlockHashWithGroupId", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.v1.core.kv_cache_utils.need_extra_keys", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.v1.core.kv_cache_utils.get_kv_cache_config_from_groups", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.v1.core.kv_cache_utils.KVCacheBlock", "methods": [ { "kind": "function", "name": "KVCacheBlock.reset_hash", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KVCacheBlock.__repr__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "KVCacheBlock.block_hash", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_typable": 2 } ], "attrs": [ { "kind": "attr", "name": "KVCacheBlock.block_id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "KVCacheBlock.ref_cnt", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "KVCacheBlock._block_hash", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "KVCacheBlock.prev_free_block", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "KVCacheBlock.next_free_block", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "KVCacheBlock.is_null", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 4, "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 0, "n_attrs": 6, "n_properties": 1 }, { "kind": "attr", "name": "vllm.v1.core.kv_cache_utils.ExternalBlockHash", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.v1.core.kv_cache_utils.BlockHashList", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.v1.core.kv_cache_utils.may_override_num_blocks", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.v1.core.kv_cache_utils.is_kv_cache_spec_uniform", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.v1.core.kv_cache_utils.generate_scheduler_kv_cache_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.v1.core.kv_cache_utils.estimate_max_model_len", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.v1.core.kv_cache_utils.create_kv_cache_group_specs", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.v1.core.kv_cache_utils.max_memory_usage_bytes", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.v1.core.kv_cache_utils.BlockHashListWithBlockSize", "methods": [ { "kind": "function", "name": "BlockHashListWithBlockSize.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BlockHashListWithBlockSize.__len__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BlockHashListWithBlockSize.__getitem__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 2, "n_params": 1, "n_function_overloads": 2, "n_function_params": 1 }, { "kind": "function", "name": "BlockHashListWithBlockSize.__iter__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BlockHashListWithBlockSize._get_value_at", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BlockHashListWithBlockSize.block_hashes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockHashListWithBlockSize.scale_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 9, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 6, "n_method_params": 5, "n_attrs": 2, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.core.kv_cache_utils.is_kv_cache_page_size_uniform", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.v1.core.kv_cache_utils.NONE_HASH", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.v1.core.kv_cache_utils.make_block_hash_with_group_id", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.v1.core.kv_cache_utils.get_request_block_hasher", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.v1.core.kv_cache_utils.generate_block_hash_extra_keys", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.v1.core.kv_cache_utils.maybe_convert_block_hash", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.v1.core.kv_cache_utils.get_kv_cache_groups", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "attr", "name": "vllm.v1.core.kv_cache_utils.BlockHash", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.v1.core.kv_cache_utils.unify_hybrid_kv_cache_specs", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.v1.core.kv_cache_utils.get_uniform_page_size", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.v1.core.kv_cache_utils.get_num_blocks", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.v1.core.kv_cache_utils.get_block_hash", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.v1.core.kv_cache_utils.unify_kv_cache_spec_page_size", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.v1.core.kv_cache_utils.get_group_id", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.v1.core.kv_cache_utils.check_enough_kv_cache_memory", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.v1.core.kv_cache_utils.is_kv_cache_type_attention_free", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.v1.core.kv_cache_utils.FreeKVCacheBlockQueue", "methods": [ { "kind": "function", "name": "FreeKVCacheBlockQueue.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FreeKVCacheBlockQueue.popleft", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FreeKVCacheBlockQueue.popleft_n", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FreeKVCacheBlockQueue.remove", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FreeKVCacheBlockQueue.append", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FreeKVCacheBlockQueue.append_n", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FreeKVCacheBlockQueue.get_all_free_blocks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FreeKVCacheBlockQueue.num_free_blocks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FreeKVCacheBlockQueue.fake_free_list_head", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FreeKVCacheBlockQueue.fake_free_list_tail", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 12, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 5, "n_attrs": 3, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.core.kv_cache_utils.init_none_hash", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.v1.core.kv_cache_utils.hash_block_tokens", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "attr", "name": "vllm.v1.core.kv_cache_utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.v1.core.kv_cache_utils.get_kv_cache_configs", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.v1.core.kv_cache_utils.get_max_concurrency_for_kv_cache_config", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.v1.core.kv_cache_utils", "names": [ "vllm.v1.core.kv_cache_utils.BlockHash", "vllm.v1.core.kv_cache_utils.BlockHashList", "vllm.v1.core.kv_cache_utils.BlockHashListWithBlockSize", "vllm.v1.core.kv_cache_utils.BlockHashWithGroupId", "vllm.v1.core.kv_cache_utils.ExternalBlockHash", "vllm.v1.core.kv_cache_utils.FreeKVCacheBlockQueue", "vllm.v1.core.kv_cache_utils.KVCacheBlock", "vllm.v1.core.kv_cache_utils.NONE_HASH", "vllm.v1.core.kv_cache_utils.check_enough_kv_cache_memory", "vllm.v1.core.kv_cache_utils.create_kv_cache_group_specs", "vllm.v1.core.kv_cache_utils.estimate_max_model_len", "vllm.v1.core.kv_cache_utils.generate_block_hash_extra_keys", "vllm.v1.core.kv_cache_utils.generate_scheduler_kv_cache_config", "vllm.v1.core.kv_cache_utils.get_block_hash", "vllm.v1.core.kv_cache_utils.get_group_id", "vllm.v1.core.kv_cache_utils.get_kv_cache_config_from_groups", "vllm.v1.core.kv_cache_utils.get_kv_cache_configs", "vllm.v1.core.kv_cache_utils.get_kv_cache_groups", "vllm.v1.core.kv_cache_utils.get_max_concurrency_for_kv_cache_config", "vllm.v1.core.kv_cache_utils.get_num_blocks", "vllm.v1.core.kv_cache_utils.get_request_block_hasher", "vllm.v1.core.kv_cache_utils.get_uniform_page_size", "vllm.v1.core.kv_cache_utils.hash_block_tokens", "vllm.v1.core.kv_cache_utils.init_none_hash", "vllm.v1.core.kv_cache_utils.is_kv_cache_page_size_uniform", "vllm.v1.core.kv_cache_utils.is_kv_cache_spec_uniform", "vllm.v1.core.kv_cache_utils.is_kv_cache_type_attention_free", "vllm.v1.core.kv_cache_utils.logger", "vllm.v1.core.kv_cache_utils.make_block_hash_with_group_id", "vllm.v1.core.kv_cache_utils.max_memory_usage_bytes", "vllm.v1.core.kv_cache_utils.may_override_num_blocks", "vllm.v1.core.kv_cache_utils.maybe_convert_block_hash", "vllm.v1.core.kv_cache_utils.need_extra_keys", "vllm.v1.core.kv_cache_utils.unify_hybrid_kv_cache_specs", "vllm.v1.core.kv_cache_utils.unify_kv_cache_spec_page_size" ], "n_typable": 110, "n_typed": 99, "n_any": 0, "n_untyped": 11, "n_functions": 26, "n_function_overloads": 26, "n_function_params": 50, "n_methods": 14, "n_method_overloads": 15, "n_method_params": 10, "n_classes": 3, "n_attrs": 17, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/v1/core/sched/async_scheduler.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.core.sched.async_scheduler.AsyncScheduler", "methods": [ { "kind": "function", "name": "AsyncScheduler.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AsyncScheduler._update_after_schedule", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AsyncScheduler._update_request_with_output", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 8, "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.core.sched.async_scheduler.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.v1.core.sched.async_scheduler", "names": [ "vllm.v1.core.sched.async_scheduler.AsyncScheduler", "vllm.v1.core.sched.async_scheduler.logger" ], "n_typable": 9, "n_typed": 6, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 5, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/core/sched/interface.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.core.sched.interface.PauseState", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "PauseState.UNPAUSED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PauseState.PAUSED_NEW", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PauseState.PAUSED_ALL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.core.sched.interface.SchedulerInterface", "methods": [ { "kind": "function", "name": "SchedulerInterface.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "SchedulerInterface.schedule", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SchedulerInterface.get_grammar_bitmask", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SchedulerInterface.update_from_output", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SchedulerInterface.update_draft_token_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SchedulerInterface.update_draft_token_ids_in_output", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SchedulerInterface.add_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SchedulerInterface.finish_requests", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SchedulerInterface.get_num_unfinished_requests", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SchedulerInterface.has_unfinished_requests", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SchedulerInterface.has_finished_requests", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SchedulerInterface.has_requests", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SchedulerInterface.set_pause_state", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SchedulerInterface.reset_prefix_cache", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SchedulerInterface.reset_encoder_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SchedulerInterface.get_request_counts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SchedulerInterface.make_stats", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SchedulerInterface.shutdown", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SchedulerInterface.get_kv_connector", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "SchedulerInterface.pause_state", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [], "n_typable": 39, "n_typed": 39, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 19, "n_method_overloads": 19, "n_method_params": 19, "n_attrs": 0, "n_properties": 1 } ], "type_ignores": [], "name": "vllm.v1.core.sched.interface", "names": [ "vllm.v1.core.sched.interface.PauseState", "vllm.v1.core.sched.interface.SchedulerInterface" ], "n_typable": 39, "n_typed": 39, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 19, "n_method_overloads": 19, "n_method_params": 19, "n_classes": 2, "n_attrs": 3, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/v1/core/sched/output.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.v1.core.sched.output.KVConnectorMetadata", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.v1.core.sched.output.ECConnectorMetadata", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.v1.core.sched.output.NewRequestData", "methods": [ { "kind": "function", "name": "NewRequestData.from_request", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "NewRequestData.__repr__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "NewRequestData.anon_repr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "NewRequestData.req_id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NewRequestData.prompt_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NewRequestData.mm_features", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NewRequestData.sampling_params", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NewRequestData.pooling_params", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NewRequestData.block_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NewRequestData.num_computed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NewRequestData.lora_request", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NewRequestData.prompt_embeds", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NewRequestData.prefill_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_attrs": 10, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.core.sched.output.PoolingParams", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.v1.core.sched.output.LoRARequest", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.v1.core.sched.output.SamplingParams", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.v1.core.sched.output.MultiModalFeatureSpec", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.v1.core.sched.output.CachedRequestData", "methods": [ { "kind": "function", "name": "CachedRequestData.anon_repr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CachedRequestData.__repr__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CachedRequestData.is_context_phase", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CachedRequestData.make_empty", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "CachedRequestData.num_reqs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "CachedRequestData._req_id_to_num_output_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "CachedRequestData.req_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CachedRequestData.resumed_req_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CachedRequestData.new_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CachedRequestData.all_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CachedRequestData.new_block_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CachedRequestData.num_computed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CachedRequestData.num_output_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 1, "n_attrs": 7, "n_properties": 2 }, { "kind": "class", "name": "vllm.v1.core.sched.output.SchedulerOutput", "methods": [ { "kind": "function", "name": "SchedulerOutput.make_empty", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SchedulerOutput.scheduled_new_reqs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SchedulerOutput.scheduled_cached_reqs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SchedulerOutput.num_scheduled_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SchedulerOutput.total_num_scheduled_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SchedulerOutput.scheduled_spec_decode_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SchedulerOutput.scheduled_encoder_inputs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SchedulerOutput.num_common_prefix_blocks", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SchedulerOutput.finished_req_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SchedulerOutput.free_encoder_mm_hashes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SchedulerOutput.preempted_req_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SchedulerOutput.has_structured_output_requests", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SchedulerOutput.pending_structured_output_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SchedulerOutput.num_invalid_spec_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SchedulerOutput.kv_connector_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SchedulerOutput.ec_connector_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SchedulerOutput.new_block_ids_to_zero", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 16, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.core.sched.output.Request", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.v1.core.sched.output.GrammarOutput", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "GrammarOutput.structured_output_request_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GrammarOutput.grammar_bitmask", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.core.sched.output", "names": [ "vllm.v1.core.sched.output.CachedRequestData", "vllm.v1.core.sched.output.ECConnectorMetadata", "vllm.v1.core.sched.output.GrammarOutput", "vllm.v1.core.sched.output.KVConnectorMetadata", "vllm.v1.core.sched.output.LoRARequest", "vllm.v1.core.sched.output.MultiModalFeatureSpec", "vllm.v1.core.sched.output.NewRequestData", "vllm.v1.core.sched.output.PoolingParams", "vllm.v1.core.sched.output.Request", "vllm.v1.core.sched.output.SamplingParams", "vllm.v1.core.sched.output.SchedulerOutput" ], "n_typable": 14, "n_typed": 14, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 4, "n_classes": 4, "n_attrs": 42, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/v1/core/sched/request_queue.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.core.sched.request_queue.PriorityRequestQueue", "methods": [ { "kind": "function", "name": "PriorityRequestQueue.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PriorityRequestQueue.add_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PriorityRequestQueue.pop_request", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PriorityRequestQueue.peek_request", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PriorityRequestQueue.prepend_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PriorityRequestQueue.prepend_requests", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PriorityRequestQueue.remove_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PriorityRequestQueue.remove_requests", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PriorityRequestQueue.__bool__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PriorityRequestQueue.__len__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PriorityRequestQueue.__iter__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 16, "n_typed": 16, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.core.sched.request_queue.FCFSRequestQueue", "methods": [ { "kind": "function", "name": "FCFSRequestQueue.add_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FCFSRequestQueue.pop_request", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FCFSRequestQueue.peek_request", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FCFSRequestQueue.prepend_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FCFSRequestQueue.prepend_requests", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FCFSRequestQueue.remove_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FCFSRequestQueue.remove_requests", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FCFSRequestQueue.__bool__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FCFSRequestQueue.__len__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FCFSRequestQueue.__iter__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 15, "n_typed": 15, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.core.sched.request_queue.RequestQueue", "methods": [ { "kind": "function", "name": "RequestQueue.add_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RequestQueue.pop_request", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RequestQueue.peek_request", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RequestQueue.prepend_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RequestQueue.prepend_requests", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RequestQueue.remove_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RequestQueue.remove_requests", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RequestQueue.__bool__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RequestQueue.__len__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RequestQueue.__iter__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 15, "n_typed": 15, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.core.sched.request_queue.create_request_queue", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.v1.core.sched.request_queue.SchedulingPolicy", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "SchedulingPolicy.FCFS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SchedulingPolicy.PRIORITY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.core.sched.request_queue", "names": [ "vllm.v1.core.sched.request_queue.FCFSRequestQueue", "vllm.v1.core.sched.request_queue.PriorityRequestQueue", "vllm.v1.core.sched.request_queue.RequestQueue", "vllm.v1.core.sched.request_queue.SchedulingPolicy", "vllm.v1.core.sched.request_queue.create_request_queue" ], "n_typable": 48, "n_typed": 48, "n_any": 0, "n_untyped": 0, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 31, "n_method_overloads": 31, "n_method_params": 15, "n_classes": 4, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/core/sched/scheduler.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.v1.core.sched.scheduler.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.core.sched.scheduler.Scheduler", "methods": [ { "kind": "function", "name": "Scheduler.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "Scheduler._mamba_block_aligned_split", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Scheduler.schedule", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Scheduler._preempt_request", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Scheduler._update_after_schedule", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Scheduler._update_request_as_session", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Scheduler._make_cached_request_data", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Scheduler._try_schedule_encoder_inputs", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Scheduler.get_grammar_bitmask", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Scheduler.update_from_output", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Scheduler._handle_stopped_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Scheduler._get_routed_experts", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Scheduler._update_request_with_output", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Scheduler._free_encoder_inputs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Scheduler.update_draft_token_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Scheduler.update_draft_token_ids_in_output", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Scheduler.get_request_counts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Scheduler.add_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Scheduler.finish_requests", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Scheduler._free_request", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Scheduler._free_blocks", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Scheduler.set_pause_state", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Scheduler.get_num_unfinished_requests", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Scheduler.has_finished_requests", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Scheduler.reset_prefix_cache", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Scheduler.reset_connector_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Scheduler.reset_encoder_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Scheduler.make_stats", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Scheduler._get_encoder_cache_usage", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Scheduler.make_spec_decoding_stats", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Scheduler.shutdown", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Scheduler.get_kv_connector", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Scheduler._connector_finished", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Scheduler._update_waiting_for_remote_kv", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Scheduler._update_from_kv_xfer_finished", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Scheduler._update_requests_with_invalid_blocks", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Scheduler._handle_invalid_blocks", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "Scheduler.pause_state", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "Scheduler.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.scheduler_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.cache_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.lora_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.kv_cache_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.kv_events_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.parallel_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.log_stats", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.observability_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.kv_metrics_collector", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.structured_output_manager", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.is_encoder_decoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.finished_req_ids_dict", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.prev_step_scheduled_req_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.max_num_running_reqs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.max_num_scheduled_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.max_model_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.enable_kv_cache_events", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.connector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.connector_prefix_cache_stats", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.recompute_kv_load_failures", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.kv_event_publisher", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.ec_connector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.dcp_world_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.pcp_world_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.requests", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.waiting", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.running", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.finished_req_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.num_waiting_for_streaming_input", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.finished_recving_kv_req_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.failed_recving_kv_req_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.supports_mm_inputs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.mm_budget", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.max_num_encoder_input_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.encoder_cache_manager", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.use_eagle", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.num_spec_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.num_lookahead_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.kv_cache_manager", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.use_pp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.use_v2_model_runner", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.has_mamba_layers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.needs_kv_cache_zeroing", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.need_mamba_block_aligned_split", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.perf_metrics", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.policy", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.routed_experts_reader", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Scheduler.max_num_kv_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 150, "n_typed": 109, "n_any": 0, "n_untyped": 41, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 37, "n_method_overloads": 37, "n_method_params": 62, "n_attrs": 50, "n_properties": 1 } ], "type_ignores": [], "name": "vllm.v1.core.sched.scheduler", "names": [ "vllm.v1.core.sched.scheduler.Scheduler", "vllm.v1.core.sched.scheduler.logger" ], "n_typable": 151, "n_typed": 109, "n_any": 0, "n_untyped": 42, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 37, "n_method_overloads": 37, "n_method_params": 62, "n_classes": 1, "n_attrs": 51, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/v1/core/sched/utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.core.sched.utils.remove_all", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.v1.core.sched.utils.check_stop", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.v1.core.sched.utils.check_sequence_repetition", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.v1.core.sched.utils", "names": [ "vllm.v1.core.sched.utils.check_sequence_repetition", "vllm.v1.core.sched.utils.check_stop", "vllm.v1.core.sched.utils.remove_all" ], "n_typable": 9, "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 6, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/core/single_type_kv_cache_manager.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.core.single_type_kv_cache_manager.SingleTypeKVCacheManager", "methods": [ { "kind": "function", "name": "SingleTypeKVCacheManager.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "SingleTypeKVCacheManager._get_num_evictable_blocks", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SingleTypeKVCacheManager.get_num_blocks_to_allocate", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "SingleTypeKVCacheManager.allocate_new_computed_blocks", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "SingleTypeKVCacheManager.allocate_new_blocks", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SingleTypeKVCacheManager.take_new_block_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SingleTypeKVCacheManager.cache_blocks", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SingleTypeKVCacheManager.free", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SingleTypeKVCacheManager.get_num_common_prefix_blocks", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SingleTypeKVCacheManager.find_longest_cache_hit", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "SingleTypeKVCacheManager.remove_skipped_blocks", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SingleTypeKVCacheManager.get_num_skipped_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SingleTypeKVCacheManager.new_step_starts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SingleTypeKVCacheManager.block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SingleTypeKVCacheManager.dcp_world_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SingleTypeKVCacheManager.pcp_world_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SingleTypeKVCacheManager.kv_cache_spec", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SingleTypeKVCacheManager.block_pool", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SingleTypeKVCacheManager.enable_caching", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SingleTypeKVCacheManager.new_block_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SingleTypeKVCacheManager.req_to_blocks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SingleTypeKVCacheManager.num_cached_block", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SingleTypeKVCacheManager.kv_cache_group_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 58, "n_typed": 50, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 35, "n_attrs": 10, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.core.single_type_kv_cache_manager.SinkFullAttentionManager", "methods": [ { "kind": "function", "name": "SinkFullAttentionManager.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SinkFullAttentionManager.sink_blocks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 6, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.core.single_type_kv_cache_manager.FullAttentionManager", "methods": [ { "kind": "function", "name": "FullAttentionManager.find_longest_cache_hit", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "FullAttentionManager.get_num_common_prefix_blocks", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 10, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.core.single_type_kv_cache_manager.SlidingWindowManager", "methods": [ { "kind": "function", "name": "SlidingWindowManager.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SlidingWindowManager.find_longest_cache_hit", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "SlidingWindowManager.get_num_skipped_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SlidingWindowManager.get_num_common_prefix_blocks", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SlidingWindowManager.sliding_window", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 16, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 13, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.core.single_type_kv_cache_manager.spec_manager_map", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.core.single_type_kv_cache_manager.CrossAttentionManager", "methods": [ { "kind": "function", "name": "CrossAttentionManager.allocate_new_computed_blocks", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "CrossAttentionManager.cache_blocks", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CrossAttentionManager.get_num_common_prefix_blocks", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CrossAttentionManager.find_longest_cache_hit", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 } ], "properties": [], "attrs": [], "n_typable": 20, "n_typed": 20, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 16, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.core.single_type_kv_cache_manager.MambaManager", "methods": [ { "kind": "function", "name": "MambaManager.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MambaManager.find_longest_cache_hit", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "MambaManager.remove_skipped_blocks", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MambaManager.get_num_common_prefix_blocks", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MambaManager.get_num_blocks_to_allocate", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MambaManager.allocate_new_blocks", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MambaManager.free", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MambaManager.get_num_skipped_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MambaManager.cache_blocks", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MambaManager.new_step_starts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MambaManager.cached_blocks_this_step", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MambaManager.mamba_cache_mode", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MambaManager.num_speculative_blocks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MambaManager.last_state_block_idx", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 41, "n_typed": 39, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 27, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.core.single_type_kv_cache_manager.ChunkedLocalAttentionManager", "methods": [ { "kind": "function", "name": "ChunkedLocalAttentionManager.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ChunkedLocalAttentionManager.find_longest_cache_hit", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "ChunkedLocalAttentionManager.get_num_skipped_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ChunkedLocalAttentionManager.get_num_common_prefix_blocks", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ChunkedLocalAttentionManager.attention_chunk_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 16, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 13, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.core.single_type_kv_cache_manager.get_manager_for_kv_cache_spec", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.v1.core.single_type_kv_cache_manager", "names": [ "vllm.v1.core.single_type_kv_cache_manager.ChunkedLocalAttentionManager", "vllm.v1.core.single_type_kv_cache_manager.CrossAttentionManager", "vllm.v1.core.single_type_kv_cache_manager.FullAttentionManager", "vllm.v1.core.single_type_kv_cache_manager.MambaManager", "vllm.v1.core.single_type_kv_cache_manager.SingleTypeKVCacheManager", "vllm.v1.core.single_type_kv_cache_manager.SinkFullAttentionManager", "vllm.v1.core.single_type_kv_cache_manager.SlidingWindowManager", "vllm.v1.core.single_type_kv_cache_manager.get_manager_for_kv_cache_spec", "vllm.v1.core.single_type_kv_cache_manager.spec_manager_map" ], "n_typable": 179, "n_typed": 162, "n_any": 0, "n_untyped": 17, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 38, "n_method_overloads": 38, "n_method_params": 120, "n_classes": 7, "n_attrs": 18, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/cudagraph_dispatcher.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.cudagraph_dispatcher.CudagraphDispatcher", "methods": [ { "kind": "function", "name": "CudagraphDispatcher.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CudagraphDispatcher._compute_bs_to_padded_graph_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CudagraphDispatcher._get_lora_cases", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CudagraphDispatcher._create_padded_batch_descriptor", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "CudagraphDispatcher.add_cudagraph_key", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CudagraphDispatcher.initialize_cudagraph_keys", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CudagraphDispatcher.dispatch", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "CudagraphDispatcher.get_capture_descs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CudagraphDispatcher.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CudagraphDispatcher.compilation_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CudagraphDispatcher.uniform_decode_query_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CudagraphDispatcher.cudagraph_keys", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CudagraphDispatcher.keys_initialized", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CudagraphDispatcher.specialize_lora_count", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CudagraphDispatcher.cudagraph_mode", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 30, "n_typed": 21, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 15, "n_attrs": 7, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.cudagraph_dispatcher.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.v1.cudagraph_dispatcher", "names": [ "vllm.v1.cudagraph_dispatcher.CudagraphDispatcher", "vllm.v1.cudagraph_dispatcher.logger" ], "n_typable": 31, "n_typed": 21, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 15, "n_classes": 1, "n_attrs": 8, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/engine/__init__.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.engine.EngineCoreEventType", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "EngineCoreEventType.QUEUED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineCoreEventType.SCHEDULED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineCoreEventType.PREEMPTED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.engine.UtilityOutput", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "UtilityOutput.call_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "UtilityOutput.failure_message", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "UtilityOutput.result", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.engine.ReconfigureRankType", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ReconfigureRankType.KEEP_CURRENT_RANK", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ReconfigureRankType.SHUTDOWN_CURRENT_RANK", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.engine.ReconfigureDistributedRequest", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ReconfigureDistributedRequest.new_data_parallel_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ReconfigureDistributedRequest.new_data_parallel_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ReconfigureDistributedRequest.new_data_parallel_rank_local", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ReconfigureDistributedRequest.new_data_parallel_master_ip", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ReconfigureDistributedRequest.new_data_parallel_master_port", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ReconfigureDistributedRequest.new_data_parallel_master_port_list", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ReconfigureDistributedRequest.new_stateless_world_group_port_list", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ReconfigureDistributedRequest.new_stateless_dp_group_port_list", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ReconfigureDistributedRequest.new_stateless_ep_group_port_list", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ReconfigureDistributedRequest.new_stateless_eplb_group_port_list", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 10, "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 10, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.engine.EEP_NOTIFICATION_CALL_ID", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.v1.engine.EngineCoreOutputs", "methods": [ { "kind": "function", "name": "EngineCoreOutputs.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EngineCoreOutputs.engine_index", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreOutputs.outputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreOutputs.scheduler_stats", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreOutputs.timestamp", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreOutputs.utility_output", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreOutputs.finished_requests", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreOutputs.wave_complete", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreOutputs.start_wave", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 9, "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.engine.EngineCoreEvent", "methods": [ { "kind": "function", "name": "EngineCoreEvent.new_event", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EngineCoreEvent.type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreEvent.timestamp", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.engine.FINISH_REASON_STRINGS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.v1.engine.PauseMode", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.engine.EEPNotificationType", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "EEPNotificationType.NEW_CORE_ENGINES_INIT_READY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EEPNotificationType.NEW_CORE_ENGINES_WEIGHTS_INIT_READY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EEPNotificationType.RECONFIGURE_FINISHED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EEPNotificationType.SHUTDOWN_COMPLETE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.engine.FinishReason", "methods": [ { "kind": "function", "name": "FinishReason.__str__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FinishReason.STOP", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FinishReason.LENGTH", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FinishReason.ABORT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FinishReason.ERROR", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FinishReason.REPETITION", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.engine.EngineCoreRequestType", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "EngineCoreRequestType.ADD", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineCoreRequestType.ABORT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineCoreRequestType.START_DP_WAVE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineCoreRequestType.UTILITY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineCoreRequestType.EXECUTOR_FAILED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.engine.EngineCoreOutput", "methods": [], "properties": [ { "kind": "property", "name": "EngineCoreOutput.finished", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "EngineCoreOutput.request_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreOutput.new_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreOutput.new_logprobs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreOutput.new_prompt_logprobs_tensors", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreOutput.pooling_output", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreOutput.finish_reason", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreOutput.stop_reason", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreOutput.events", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreOutput.kv_transfer_params", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreOutput.trace_headers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreOutput.num_cached_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreOutput.num_external_computed_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreOutput.routed_experts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreOutput.num_nans_in_logits", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 15, "n_typed": 15, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 14, "n_properties": 1 }, { "kind": "class", "name": "vllm.v1.engine.EngineCoreRequest", "methods": [], "properties": [ { "kind": "property", "name": "EngineCoreRequest.params", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "EngineCoreRequest.eos_token_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "EngineCoreRequest.request_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreRequest.prompt_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreRequest.mm_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreRequest.sampling_params", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreRequest.pooling_params", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreRequest.arrival_time", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreRequest.lora_request", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreRequest.cache_salt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreRequest.data_parallel_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreRequest.prompt_embeds", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreRequest.client_index", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreRequest.current_wave", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreRequest.priority", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreRequest.trace_headers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreRequest.resumable", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreRequest.external_req_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreRequest.reasoning_ended", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 19, "n_typed": 19, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 17, "n_properties": 2 } ], "type_ignores": [ { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] } ], "name": "vllm.v1.engine", "names": [ "vllm.v1.engine.EEPNotificationType", "vllm.v1.engine.EEP_NOTIFICATION_CALL_ID", "vllm.v1.engine.EngineCoreEvent", "vllm.v1.engine.EngineCoreEventType", "vllm.v1.engine.EngineCoreOutput", "vllm.v1.engine.EngineCoreOutputs", "vllm.v1.engine.EngineCoreRequest", "vllm.v1.engine.EngineCoreRequestType", "vllm.v1.engine.FINISH_REASON_STRINGS", "vllm.v1.engine.FinishReason", "vllm.v1.engine.PauseMode", "vllm.v1.engine.ReconfigureDistributedRequest", "vllm.v1.engine.ReconfigureRankType", "vllm.v1.engine.UtilityOutput" ], "n_typable": 63, "n_typed": 61, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 2, "n_classes": 11, "n_attrs": 76, "n_properties": 3, "n_type_ignores": 11 }, { "path": "vllm/v1/engine/coordinator.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.engine.coordinator.DPCoordinator", "methods": [ { "kind": "function", "name": "DPCoordinator.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DPCoordinator.get_stats_publish_address", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DPCoordinator.get_engine_socket_addresses", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DPCoordinator.close", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DPCoordinator.proc", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DPCoordinator.stats_publish_address", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DPCoordinator.coord_in_address", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DPCoordinator.coord_out_address", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 5, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 2, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.engine.coordinator.DPCoordinatorProc", "methods": [ { "kind": "function", "name": "DPCoordinatorProc.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DPCoordinatorProc.run_coordinator", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "DPCoordinatorProc.process_input_socket", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DPCoordinatorProc._send_start_wave", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DPCoordinatorProc._get_engine_counts", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DPCoordinatorProc.ctx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DPCoordinatorProc.engines", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DPCoordinatorProc.stats_update_interval_ms", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DPCoordinatorProc.enable_wave_coordination", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 25, "n_typed": 16, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 16, "n_attrs": 4, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.engine.coordinator.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.engine.coordinator.EngineState", "methods": [ { "kind": "function", "name": "EngineState.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EngineState.request_counts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 2, "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.engine.coordinator", "names": [ "vllm.v1.engine.coordinator.DPCoordinator", "vllm.v1.engine.coordinator.DPCoordinatorProc", "vllm.v1.engine.coordinator.EngineState", "vllm.v1.engine.coordinator.logger" ], "n_typable": 38, "n_typed": 21, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 18, "n_classes": 3, "n_attrs": 10, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/engine/core.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.engine.core.EngineCoreActorMixin", "methods": [ { "kind": "function", "name": "EngineCoreActorMixin.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "EngineCoreActorMixin._set_visible_devices", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EngineCoreActorMixin._set_cuda_visible_devices", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "EngineCoreActorMixin._perform_handshakes", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "EngineCoreActorMixin.wait_for_init", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineCoreActorMixin.run", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EngineCoreActorMixin.addresses", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 21, "n_typed": 14, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 14, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.engine.core.DPMoEEngineCoreActor", "methods": [ { "kind": "function", "name": "DPMoEEngineCoreActor.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [], "n_typable": 8, "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 7, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.engine.core.DPEngineCoreProc", "methods": [ { "kind": "function", "name": "DPEngineCoreProc.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "DPEngineCoreProc._init_data_parallel", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DPEngineCoreProc.shutdown", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DPEngineCoreProc.add_request", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DPEngineCoreProc.resume_scheduler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DPEngineCoreProc._handle_client_request", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DPEngineCoreProc._maybe_publish_request_counts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DPEngineCoreProc.run_busy_loop", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DPEngineCoreProc._has_global_unfinished_reqs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DPEngineCoreProc.reinitialize_distributed", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DPEngineCoreProc._eep_send_engine_core_notification", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DPEngineCoreProc.eep_handle_engine_core_notification", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DPEngineCoreProc._eep_scale_up_before_kv_init", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DPEngineCoreProc.step_counter", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DPEngineCoreProc.current_wave", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DPEngineCoreProc.last_counts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DPEngineCoreProc.eep_scaling_state", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 33, "n_typed": 19, "n_any": 1, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 16, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.engine.core.EngineCoreActor", "methods": [ { "kind": "function", "name": "EngineCoreActor.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "properties": [], "attrs": [], "n_typable": 8, "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 7, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.engine.core.HANDSHAKE_TIMEOUT_MINS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.v1.engine.core.EngineCore", "methods": [ { "kind": "function", "name": "EngineCore.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "EngineCore._initialize_kv_caches", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EngineCore.get_supported_tasks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineCore.add_request", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EngineCore.abort_requests", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EngineCore.log_error_detail", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EngineCore.log_iteration_details", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EngineCore.step", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineCore.post_step", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EngineCore.step_with_batch_queue", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineCore._process_aborts_queue", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineCore.shutdown", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineCore.profile", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EngineCore.reset_mm_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineCore.reset_prefix_cache", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EngineCore.reset_encoder_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineCore._reset_caches", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EngineCore.pause_scheduler", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EngineCore.resume_scheduler", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineCore.is_scheduler_paused", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineCore.sleep", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EngineCore.wake_up", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EngineCore.is_sleeping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineCore.execute_dummy_batch", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineCore.add_lora", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EngineCore.remove_lora", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EngineCore.list_loras", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineCore.pin_lora", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EngineCore.save_sharded_state", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "EngineCore.collective_rpc", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "EngineCore.preprocess_add_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EngineCore._eep_scale_up_before_kv_init", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineCore._eep_send_engine_core_notification", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EngineCore.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EngineCore.log_stats", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EngineCore.model_executor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EngineCore.available_gpu_memory_for_kv_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EngineCore.structured_output_manager", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EngineCore.scheduler", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCore.use_spec_decode", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EngineCore.mm_registry", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EngineCore.mm_receiver_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EngineCore.batch_queue_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EngineCore.batch_queue", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCore.is_ec_producer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EngineCore.is_pooling_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EngineCore.request_block_hasher", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCore.step_fn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EngineCore.async_scheduling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EngineCore.aborts_queue", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 85, "n_typed": 57, "n_any": 0, "n_untyped": 28, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 33, "n_method_overloads": 33, "n_method_params": 35, "n_attrs": 17, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.engine.core.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.engine.core.EngineCoreProc", "methods": [ { "kind": "function", "name": "EngineCoreProc.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "EngineCoreProc._perform_handshakes", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "EngineCoreProc._perform_handshake", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "EngineCoreProc.startup_handshake", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "EngineCoreProc.run_engine_core", "n_typed": 2, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "EngineCoreProc._init_data_parallel", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EngineCoreProc.has_work", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineCoreProc.run_busy_loop", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineCoreProc._process_input_queue", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineCoreProc._process_engine_step", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineCoreProc._notify_idle_state_callbacks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineCoreProc._handle_client_request", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EngineCoreProc._invoke_utility_method", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "EngineCoreProc._convert_msgspec_args", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EngineCoreProc._send_engine_dead", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineCoreProc.process_input_sockets", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "EngineCoreProc.process_output_sockets", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "EngineCoreProc._handle_request_preproc_error", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EngineCoreProc.pause_scheduler", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EngineCoreProc._send_abort_outputs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EngineCoreProc.ENGINE_CORE_DEAD", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineCoreProc.addresses", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreProc.input_queue", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreProc.output_queue", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreProc.engine_index", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreProc.engines_running", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreProc.client_count", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreProc.has_coordinator", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreProc.frontend_stats_publish_address", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreProc.publish_dp_lb_stats", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreProc.process_input_queue_block", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EngineCoreProc.output_thread", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 78, "n_typed": 53, "n_any": 1, "n_untyped": 24, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 20, "n_method_overloads": 20, "n_method_params": 47, "n_attrs": 12, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.engine.core", "names": [ "vllm.v1.engine.core.DPEngineCoreProc", "vllm.v1.engine.core.DPMoEEngineCoreActor", "vllm.v1.engine.core.EngineCore", "vllm.v1.engine.core.EngineCoreActor", "vllm.v1.engine.core.EngineCoreActorMixin", "vllm.v1.engine.core.EngineCoreProc", "vllm.v1.engine.core.HANDSHAKE_TIMEOUT_MINS", "vllm.v1.engine.core.logger" ], "n_typable": 234, "n_typed": 157, "n_any": 2, "n_untyped": 75, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 74, "n_method_overloads": 74, "n_method_params": 126, "n_classes": 6, "n_attrs": 36, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/engine/core_client.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.v1.engine.core_client.EngineIdentity", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.v1.engine.core_client.AnyFuture", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.engine.core_client.SyncMPClient", "methods": [ { "kind": "function", "name": "SyncMPClient.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SyncMPClient.get_output", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SyncMPClient._send_input", "n_typed": 1, "n_any": 1, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SyncMPClient.call_utility", "n_typed": 1, "n_any": 1, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SyncMPClient.get_supported_tasks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SyncMPClient.add_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SyncMPClient.abort_requests", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SyncMPClient.profile", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SyncMPClient.reset_mm_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SyncMPClient.reset_prefix_cache", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SyncMPClient.reset_encoder_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SyncMPClient.add_lora", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SyncMPClient.remove_lora", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SyncMPClient.list_loras", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SyncMPClient.pin_lora", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SyncMPClient.sleep", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SyncMPClient.wake_up", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SyncMPClient.is_sleeping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SyncMPClient.execute_dummy_batch", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SyncMPClient.collective_rpc", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "SyncMPClient.save_sharded_state", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SyncMPClient.is_dp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SyncMPClient.outputs_queue", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SyncMPClient.output_queue_thread", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 50, "n_typed": 42, "n_any": 2, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 21, "n_method_overloads": 21, "n_method_params": 26, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.engine.core_client.InprocClient", "methods": [ { "kind": "function", "name": "InprocClient.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InprocClient.get_output", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "InprocClient.get_supported_tasks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "InprocClient.add_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InprocClient.abort_requests", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InprocClient.shutdown", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "InprocClient.profile", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InprocClient.reset_mm_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "InprocClient.reset_prefix_cache", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InprocClient.reset_encoder_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "InprocClient.sleep", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InprocClient.wake_up", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InprocClient.is_sleeping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "InprocClient.execute_dummy_batch", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "InprocClient.add_lora", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InprocClient.remove_lora", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InprocClient.list_loras", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "InprocClient.pin_lora", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InprocClient.save_sharded_state", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "InprocClient.collective_rpc", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "InprocClient.dp_engines_running", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "InprocClient.engine_core", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 43, "n_typed": 39, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 21, "n_method_overloads": 21, "n_method_params": 21, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.engine.core_client.ElasticScalingCache", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ElasticScalingCache.existing_core_engines", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ElasticScalingCache.num_new_core_engines", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ElasticScalingCache.pending_notifications", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.engine.core_client.MPClient", "methods": [ { "kind": "function", "name": "MPClient.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "MPClient.shutdown", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MPClient._format_exception", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MPClient.ensure_alive", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MPClient.add_pending_message", "n_typed": 1, "n_any": 1, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MPClient.free_pending_messages", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MPClient.dp_engines_running", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MPClient.start_engine_core_monitor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MPClient.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MPClient.encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MPClient.decoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MPClient.ctx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MPClient.resources", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MPClient.engines_running", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MPClient.stats_update_address", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MPClient.engine_ranks_managed", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MPClient.core_engines", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MPClient.core_engine", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MPClient.utility_results", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MPClient.pending_messages", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MPClient.input_socket", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 29, "n_typed": 13, "n_any": 1, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 8, "n_attrs": 13, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.engine.core_client.allocate_stateless_group_ports", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.v1.engine.core_client.BackgroundResources", "methods": [ { "kind": "function", "name": "BackgroundResources.__call__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BackgroundResources.validate_alive", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BackgroundResources.ctx", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BackgroundResources.engine_manager", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BackgroundResources.coordinator", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BackgroundResources.output_socket", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BackgroundResources.input_socket", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BackgroundResources.first_req_send_socket", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BackgroundResources.first_req_rcv_socket", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BackgroundResources.stats_update_socket", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BackgroundResources.output_queue_task", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BackgroundResources.stats_update_task", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BackgroundResources.shutdown_path", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BackgroundResources.engine_dead", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 3, "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 12, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.engine.core_client.EngineCoreClient", "methods": [ { "kind": "function", "name": "EngineCoreClient.make_client", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "EngineCoreClient.make_async_mp_client", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "EngineCoreClient.shutdown", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineCoreClient.get_output", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineCoreClient.get_supported_tasks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineCoreClient.add_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EngineCoreClient.profile", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EngineCoreClient.reset_mm_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineCoreClient.reset_prefix_cache", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EngineCoreClient.reset_encoder_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineCoreClient.sleep", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EngineCoreClient.wake_up", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EngineCoreClient.is_sleeping", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineCoreClient.execute_dummy_batch", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineCoreClient.execute_dummy_batch_async", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineCoreClient.abort_requests", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EngineCoreClient.add_lora", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EngineCoreClient.remove_lora", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EngineCoreClient.list_loras", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineCoreClient.pin_lora", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EngineCoreClient.save_sharded_state", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "EngineCoreClient.collective_rpc", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "EngineCoreClient.dp_engines_running", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineCoreClient.scale_elastic_ep", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EngineCoreClient.get_output_async", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineCoreClient.get_supported_tasks_async", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineCoreClient.add_request_async", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EngineCoreClient.profile_async", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EngineCoreClient.reset_mm_cache_async", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineCoreClient.reset_prefix_cache_async", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EngineCoreClient.reset_encoder_cache_async", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineCoreClient.sleep_async", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EngineCoreClient.wake_up_async", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EngineCoreClient.is_sleeping_async", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineCoreClient.abort_requests_async", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EngineCoreClient.add_lora_async", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EngineCoreClient.remove_lora_async", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EngineCoreClient.list_loras_async", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EngineCoreClient.pin_lora_async", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EngineCoreClient.save_sharded_state_async", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "EngineCoreClient.collective_rpc_async", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [], "n_typable": 91, "n_typed": 90, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 41, "n_method_overloads": 41, "n_method_params": 50, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.engine.core_client.DPAsyncMPClient", "methods": [ { "kind": "function", "name": "DPAsyncMPClient.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "DPAsyncMPClient._ensure_stats_update_task", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DPAsyncMPClient.add_request_async", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DPAsyncMPClient.get_core_engine_for_request", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DPAsyncMPClient.current_wave", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DPAsyncMPClient.lb_engines", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DPAsyncMPClient.eep_scaling_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DPAsyncMPClient.first_req_sock_addr", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DPAsyncMPClient.first_req_send_socket", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 11, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.engine.core_client.DPLBAsyncMPClient", "methods": [ { "kind": "function", "name": "DPLBAsyncMPClient.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "DPLBAsyncMPClient.get_core_engine_for_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DPLBAsyncMPClient.call_utility_async", "n_typed": 1, "n_any": 1, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DPLBAsyncMPClient.process_engine_outputs", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DPLBAsyncMPClient.eep_process_engine_core_notification", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DPLBAsyncMPClient.abort_requests_async", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DPLBAsyncMPClient._abort_requests", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DPLBAsyncMPClient.scale_elastic_ep", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DPLBAsyncMPClient._eep_wait_for_setup_switch_complete", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DPLBAsyncMPClient._scale_up_elastic_ep", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DPLBAsyncMPClient._scale_down_elastic_ep", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DPLBAsyncMPClient.client_count", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DPLBAsyncMPClient.reqs_in_flight", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DPLBAsyncMPClient.eng_start_index", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 35, "n_typed": 28, "n_any": 1, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 21, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.engine.core_client.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.engine.core_client.AsyncMPClient", "methods": [ { "kind": "function", "name": "AsyncMPClient.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "AsyncMPClient._ensure_output_queue_task", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AsyncMPClient.get_output_async", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AsyncMPClient._send_input", "n_typed": 3, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "AsyncMPClient._send_input_message", "n_typed": 3, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "AsyncMPClient.call_utility_async", "n_typed": 1, "n_any": 1, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AsyncMPClient._call_utility_async", "n_typed": 2, "n_any": 1, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "AsyncMPClient.get_supported_tasks_async", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AsyncMPClient.add_request_async", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AsyncMPClient.abort_requests_async", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AsyncMPClient.pause_scheduler_async", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AsyncMPClient.resume_scheduler_async", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AsyncMPClient.is_scheduler_paused_async", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AsyncMPClient.profile_async", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AsyncMPClient.reset_mm_cache_async", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AsyncMPClient.reset_prefix_cache_async", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AsyncMPClient.reset_encoder_cache_async", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AsyncMPClient.sleep_async", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AsyncMPClient.wake_up_async", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AsyncMPClient.is_sleeping_async", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AsyncMPClient.execute_dummy_batch_async", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AsyncMPClient.add_lora_async", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AsyncMPClient.remove_lora_async", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AsyncMPClient.list_loras_async", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AsyncMPClient.pin_lora_async", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AsyncMPClient.save_sharded_state_async", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "AsyncMPClient.collective_rpc_async", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AsyncMPClient.client_count", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AsyncMPClient.client_index", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AsyncMPClient.outputs_queue", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 68, "n_typed": 57, "n_any": 4, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 27, "n_method_overloads": 27, "n_method_params": 38, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.engine.core_client", "names": [ "vllm.v1.engine.core_client.AnyFuture", "vllm.v1.engine.core_client.AsyncMPClient", "vllm.v1.engine.core_client.BackgroundResources", "vllm.v1.engine.core_client.DPAsyncMPClient", "vllm.v1.engine.core_client.DPLBAsyncMPClient", "vllm.v1.engine.core_client.ElasticScalingCache", "vllm.v1.engine.core_client.EngineCoreClient", "vllm.v1.engine.core_client.EngineIdentity", "vllm.v1.engine.core_client.InprocClient", "vllm.v1.engine.core_client.MPClient", "vllm.v1.engine.core_client.SyncMPClient", "vllm.v1.engine.core_client.allocate_stateless_group_ports", "vllm.v1.engine.core_client.logger" ], "n_typable": 341, "n_typed": 283, "n_any": 8, "n_untyped": 50, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 135, "n_method_overloads": 135, "n_method_params": 173, "n_classes": 9, "n_attrs": 46, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/engine/detokenizer.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.v1.engine.detokenizer.INVALID_PREFIX_ERR_MSG", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.v1.engine.detokenizer.SlowIncrementalDetokenizer", "methods": [ { "kind": "function", "name": "SlowIncrementalDetokenizer.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SlowIncrementalDetokenizer.num_output_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SlowIncrementalDetokenizer.decode_next", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "SlowIncrementalDetokenizer.output_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "SlowIncrementalDetokenizer.tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SlowIncrementalDetokenizer.prompt_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SlowIncrementalDetokenizer.skip_special_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SlowIncrementalDetokenizer.spaces_between_special_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SlowIncrementalDetokenizer.tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SlowIncrementalDetokenizer.prefix_offset", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SlowIncrementalDetokenizer.read_offset", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 6, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_attrs": 7, "n_properties": 1 }, { "kind": "function", "name": "vllm.v1.engine.detokenizer.check_stop_strings", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.v1.engine.detokenizer.IncrementalDetokenizer", "methods": [ { "kind": "function", "name": "IncrementalDetokenizer.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "IncrementalDetokenizer.num_output_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "IncrementalDetokenizer.update", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "IncrementalDetokenizer.get_next_output_text", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "IncrementalDetokenizer.from_new_request", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [ { "kind": "property", "name": "IncrementalDetokenizer.output_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "IncrementalDetokenizer.token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 13, "n_typed": 12, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 6, "n_attrs": 1, "n_properties": 1 }, { "kind": "attr", "name": "vllm.v1.engine.detokenizer.USE_FAST_DETOKENIZER", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.engine.detokenizer.BaseIncrementalDetokenizer", "methods": [ { "kind": "function", "name": "BaseIncrementalDetokenizer.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseIncrementalDetokenizer.update", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BaseIncrementalDetokenizer.decode_next", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BaseIncrementalDetokenizer.get_next_output_text", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BaseIncrementalDetokenizer.stop", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseIncrementalDetokenizer.min_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseIncrementalDetokenizer.include_stop_str_in_output", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseIncrementalDetokenizer.output_text", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BaseIncrementalDetokenizer.stop_buffer_length", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 9, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 6, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.engine.detokenizer.FastIncrementalDetokenizer", "methods": [ { "kind": "function", "name": "FastIncrementalDetokenizer.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FastIncrementalDetokenizer.decode_next", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FastIncrementalDetokenizer._protected_step", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FastIncrementalDetokenizer.request_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FastIncrementalDetokenizer.skip_special_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FastIncrementalDetokenizer.tokenizer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FastIncrementalDetokenizer.stream", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FastIncrementalDetokenizer.spaces_between_special_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FastIncrementalDetokenizer.last_special", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FastIncrementalDetokenizer.added_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 7, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_attrs": 7, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.engine.detokenizer.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.v1.engine.detokenizer", "names": [ "vllm.v1.engine.detokenizer.BaseIncrementalDetokenizer", "vllm.v1.engine.detokenizer.FastIncrementalDetokenizer", "vllm.v1.engine.detokenizer.INVALID_PREFIX_ERR_MSG", "vllm.v1.engine.detokenizer.IncrementalDetokenizer", "vllm.v1.engine.detokenizer.SlowIncrementalDetokenizer", "vllm.v1.engine.detokenizer.USE_FAST_DETOKENIZER", "vllm.v1.engine.detokenizer.check_stop_strings", "vllm.v1.engine.detokenizer.logger" ], "n_typable": 63, "n_typed": 39, "n_any": 0, "n_untyped": 24, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 4, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 19, "n_classes": 4, "n_attrs": 23, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/v1/engine/exceptions.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.engine.exceptions.EngineDeadError", "methods": [ { "kind": "function", "name": "EngineDeadError.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.engine.exceptions.EngineGenerateError", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.engine.exceptions", "names": [ "vllm.v1.engine.exceptions.EngineDeadError", "vllm.v1.engine.exceptions.EngineGenerateError" ], "n_typable": 4, "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 3, "n_classes": 2, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/engine/input_processor.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.engine.input_processor.InputProcessor", "methods": [ { "kind": "function", "name": "InputProcessor.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "InputProcessor.get_tokenizer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "InputProcessor._validate_params", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InputProcessor._validate_lora", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InputProcessor._get_mm_identifier", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InputProcessor.assign_request_id", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InputProcessor.process_inputs", "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "InputProcessor._validate_prompt_len", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InputProcessor._validate_model_input", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InputProcessor._validate_model_inputs", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [ { "kind": "property", "name": "InputProcessor.tokenizer", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "InputProcessor.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputProcessor.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputProcessor.cache_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputProcessor.lora_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputProcessor.scheduler_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputProcessor.speculative_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputProcessor.structured_outputs_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputProcessor.observability_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputProcessor.generation_config_fields", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputProcessor.renderer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputProcessor.supports_mm_inputs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputProcessor.mm_encoder_cache_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputProcessor.skip_prompt_length_check", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputProcessor.input_preprocessor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 51, "n_typed": 34, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 26, "n_attrs": 14, "n_properties": 1 }, { "kind": "attr", "name": "vllm.v1.engine.input_processor.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.v1.engine.input_processor", "names": [ "vllm.v1.engine.input_processor.InputProcessor", "vllm.v1.engine.input_processor.logger" ], "n_typable": 52, "n_typed": 34, "n_any": 0, "n_untyped": 18, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 26, "n_classes": 1, "n_attrs": 15, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/v1/engine/logprobs.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.engine.logprobs.LogprobsProcessor", "methods": [ { "kind": "function", "name": "LogprobsProcessor.from_new_request", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LogprobsProcessor._update_sample_logprobs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LogprobsProcessor._update_prompt_logprobs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LogprobsProcessor.pop_prompt_logprobs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LogprobsProcessor._correct_decoded_token", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LogprobsProcessor._verify_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LogprobsProcessor.update_from_output", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LogprobsProcessor.tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LogprobsProcessor.logprobs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LogprobsProcessor.prompt_logprobs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LogprobsProcessor.cumulative_logprob", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LogprobsProcessor.num_logprobs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LogprobsProcessor.num_prompt_logprobs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 16, "n_typed": 16, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 9, "n_attrs": 6, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.engine.logprobs.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.v1.engine.logprobs.NONES", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.v1.engine.logprobs", "names": [ "vllm.v1.engine.logprobs.LogprobsProcessor", "vllm.v1.engine.logprobs.NONES", "vllm.v1.engine.logprobs.logger" ], "n_typable": 18, "n_typed": 16, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 9, "n_classes": 1, "n_attrs": 8, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/engine/output_processor.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.engine.output_processor.RequestOutputCollector", "methods": [ { "kind": "function", "name": "RequestOutputCollector.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "RequestOutputCollector.put", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RequestOutputCollector.get", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RequestOutputCollector.get_nowait", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RequestOutputCollector.close", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RequestOutputCollector.__del__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RequestOutputCollector.aggregate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestOutputCollector.request_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestOutputCollector.output", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "RequestOutputCollector.ready", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 7, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 3, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.engine.output_processor.StreamingUpdate", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "StreamingUpdate.prompt", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StreamingUpdate.prompt_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StreamingUpdate.arrival_time", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StreamingUpdate.final", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.engine.output_processor.RequestState", "methods": [ { "kind": "function", "name": "RequestState.__init__", "n_typed": 20, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 21, "n_params": 20, "n_function_overloads": 1, "n_function_params": 20 }, { "kind": "function", "name": "RequestState.apply_streaming_update", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RequestState.from_new_request", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "RequestState.make_request_output", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "RequestState._new_request_output", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "RequestState._new_completion_output", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "RequestState._new_pooling_output", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RequestState.request_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.external_req_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.parent_req", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.request_index", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.lora_request", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.lora_name", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.output_kind", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.prompt", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.prompt_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.prompt_embeds", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.prompt_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.logprobs_processor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.detokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.max_tokens_param", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.top_p", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.n", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.temperature", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.is_prefilling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.queue", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.num_cached_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.stats", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.stream_interval", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.sent_tokens_offset", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.streaming_input", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.input_chunk_queue", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 76, "n_typed": 51, "n_any": 0, "n_untyped": 25, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 44, "n_attrs": 25, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.engine.output_processor.EMPTY_CPU_TENSOR", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.engine.output_processor.OutputProcessorOutput", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "OutputProcessorOutput.request_outputs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "OutputProcessorOutput.reqs_to_abort", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.engine.output_processor.OutputProcessor", "methods": [ { "kind": "function", "name": "OutputProcessor.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "OutputProcessor.get_num_unfinished_requests", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "OutputProcessor.has_unfinished_requests", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "OutputProcessor.propagate_error", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OutputProcessor.abort_requests", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OutputProcessor.add_request", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "OutputProcessor._update_streaming_request_state", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "OutputProcessor.process_outputs", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "OutputProcessor._finish_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OutputProcessor.update_scheduler_stats", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OutputProcessor.do_tracing", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "OutputProcessor._update_stats_from_output", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "OutputProcessor._update_stats_from_finished", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OutputProcessor.log_stats", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OutputProcessor.tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OutputProcessor.stream_interval", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OutputProcessor.request_states", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "OutputProcessor.parent_requests", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "OutputProcessor.external_req_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "OutputProcessor.lora_states", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OutputProcessor.tracing_enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 51, "n_typed": 40, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 30, "n_attrs": 8, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.engine.output_processor", "names": [ "vllm.v1.engine.output_processor.EMPTY_CPU_TENSOR", "vllm.v1.engine.output_processor.OutputProcessor", "vllm.v1.engine.output_processor.OutputProcessorOutput", "vllm.v1.engine.output_processor.RequestOutputCollector", "vllm.v1.engine.output_processor.RequestState", "vllm.v1.engine.output_processor.StreamingUpdate" ], "n_typable": 141, "n_typed": 98, "n_any": 0, "n_untyped": 43, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 26, "n_method_overloads": 26, "n_method_params": 77, "n_classes": 5, "n_attrs": 44, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/engine/parallel_sampling.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.engine.parallel_sampling.ParentRequest", "methods": [ { "kind": "function", "name": "ParentRequest.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ParentRequest._get_child_sampling_params", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ParentRequest.get_child_info", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ParentRequest.get_outputs", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ParentRequest.observe_num_generation_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ParentRequest.observe_finished_request", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [ { "kind": "property", "name": "ParentRequest.n", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "ParentRequest.request_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParentRequest.external_req_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParentRequest.sampling_params", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParentRequest.child_requests", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParentRequest.output_aggregator", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParentRequest.max_num_generation_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ParentRequest.cached_child_sampling_params", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 23, "n_typed": 21, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 9, "n_attrs": 7, "n_properties": 1 } ], "type_ignores": [], "name": "vllm.v1.engine.parallel_sampling", "names": [ "vllm.v1.engine.parallel_sampling.ParentRequest" ], "n_typable": 23, "n_typed": 21, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 9, "n_classes": 1, "n_attrs": 7, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/v1/engine/utils.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.engine.utils.CoreEngineActorManager", "methods": [ { "kind": "function", "name": "CoreEngineActorManager.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "CoreEngineActorManager.create_dp_placement_groups", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CoreEngineActorManager.add_dp_placement_groups", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CoreEngineActorManager.scale_up_elastic_ep", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CoreEngineActorManager.scale_down_elastic_ep", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CoreEngineActorManager.get_run_refs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CoreEngineActorManager.close", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CoreEngineActorManager.local_engine_actors", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CoreEngineActorManager.remote_engine_actors", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CoreEngineActorManager.env_vars_dict", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CoreEngineActorManager.addresses", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CoreEngineActorManager.executor_class", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CoreEngineActorManager.log_stats", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CoreEngineActorManager.placement_group_is_local", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CoreEngineActorManager.run_refs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CoreEngineActorManager.created_placement_groups", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 29, "n_typed": 19, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 13, "n_attrs": 9, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.engine.utils.set_device_control_env_var", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.v1.engine.utils.CoreEngineProcManager", "methods": [ { "kind": "function", "name": "CoreEngineProcManager.__init__", "n_typed": 10, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "CoreEngineProcManager.close", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CoreEngineProcManager.join_first", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CoreEngineProcManager.sentinels", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CoreEngineProcManager.finished_procs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CoreEngineProcManager.processes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 16, "n_typed": 13, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 10, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.engine.utils.get_device_indices", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.v1.engine.utils.get_engine_zmq_addresses", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.v1.engine.utils.CoreEngine", "methods": [ { "kind": "function", "name": "CoreEngine.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CoreEngine.local", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CoreEngine.identity", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CoreEngine.state", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 6, "n_typed": 2, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.engine.utils.CoreEngineState", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "CoreEngineState.NEW", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CoreEngineState.CONNECTED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CoreEngineState.READY", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.engine.utils.EngineHandshakeMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "EngineHandshakeMetadata.addresses", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineHandshakeMetadata.parallel_config", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.engine.utils.wait_for_engine_startup", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "attr", "name": "vllm.v1.engine.utils.STARTUP_POLL_PERIOD_MS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.v1.engine.utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.engine.utils.EngineZmqAddresses", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "EngineZmqAddresses.inputs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineZmqAddresses.outputs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineZmqAddresses.coordinator_input", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineZmqAddresses.coordinator_output", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EngineZmqAddresses.frontend_stats_publish_address", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 5, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.engine.utils.launch_core_engines", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "type_ignores": [], "name": "vllm.v1.engine.utils", "names": [ "vllm.v1.engine.utils.CoreEngine", "vllm.v1.engine.utils.CoreEngineActorManager", "vllm.v1.engine.utils.CoreEngineProcManager", "vllm.v1.engine.utils.CoreEngineState", "vllm.v1.engine.utils.EngineHandshakeMetadata", "vllm.v1.engine.utils.EngineZmqAddresses", "vllm.v1.engine.utils.STARTUP_POLL_PERIOD_MS", "vllm.v1.engine.utils.get_device_indices", "vllm.v1.engine.utils.get_engine_zmq_addresses", "vllm.v1.engine.utils.launch_core_engines", "vllm.v1.engine.utils.logger", "vllm.v1.engine.utils.set_device_control_env_var", "vllm.v1.engine.utils.wait_for_engine_startup" ], "n_typable": 78, "n_typed": 58, "n_any": 0, "n_untyped": 20, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 21, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 25, "n_classes": 6, "n_attrs": 25, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/executor/abstract.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.executor.abstract.Executor", "methods": [ { "kind": "function", "name": "Executor.get_class", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Executor.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Executor._init_executor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Executor.initialize_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Executor.register_failure_callback", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Executor.determine_available_memory", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Executor.get_kv_cache_specs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Executor.collective_rpc", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 6, "n_params": 5, "n_function_overloads": 2, "n_function_params": 5 }, { "kind": "function", "name": "Executor.get_kv_connector_handshake_metadata", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Executor.execute_model", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 3, "n_params": 2, "n_function_overloads": 2, "n_function_params": 2 }, { "kind": "function", "name": "Executor.sample_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 3, "n_params": 2, "n_function_overloads": 2, "n_function_params": 2 }, { "kind": "function", "name": "Executor.execute_dummy_batch", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Executor.take_draft_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Executor.profile", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Executor.save_sharded_state", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Executor.check_health", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Executor.shutdown", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Executor.init_kv_output_aggregator", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Executor.add_lora", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Executor.remove_lora", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Executor.pin_lora", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Executor.list_loras", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Executor.reset_mm_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Executor.reset_encoder_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Executor.sleep", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Executor.wake_up", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Executor.reinitialize_distributed", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "Executor.max_concurrent_batches", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Executor.supported_tasks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "Executor.uses_ray", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Executor.supports_pp", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Executor.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Executor.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Executor.cache_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Executor.lora_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Executor.load_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Executor.parallel_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Executor.scheduler_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Executor.device_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Executor.speculative_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Executor.observability_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Executor.is_sleeping", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Executor.sleeping_tags", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Executor.kv_output_aggregator", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 69, "n_typed": 54, "n_any": 0, "n_untyped": 15, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 27, "n_method_overloads": 30, "n_method_params": 25, "n_attrs": 15, "n_properties": 2 }, { "kind": "attr", "name": "vllm.v1.executor.abstract.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.v1.executor.abstract.FailureCallback", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.v1.executor.abstract", "names": [ "vllm.v1.executor.abstract.Executor", "vllm.v1.executor.abstract.FailureCallback", "vllm.v1.executor.abstract.logger" ], "n_typable": 71, "n_typed": 55, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 27, "n_method_overloads": 30, "n_method_params": 25, "n_classes": 1, "n_attrs": 17, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/v1/executor/uniproc_executor.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.executor.uniproc_executor.UniProcExecutor", "methods": [ { "kind": "function", "name": "UniProcExecutor._init_executor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "UniProcExecutor._distributed_args", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "UniProcExecutor.collective_rpc", "n_typed": 6, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "UniProcExecutor.execute_model", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "UniProcExecutor.sample_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "UniProcExecutor.take_draft_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "UniProcExecutor.check_health", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "UniProcExecutor.shutdown", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "UniProcExecutor.max_concurrent_batches", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [], "n_typable": 19, "n_typed": 18, "n_any": 1, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 10, "n_attrs": 0, "n_properties": 1 }, { "kind": "attr", "name": "vllm.v1.executor.uniproc_executor.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.executor.uniproc_executor.ExecutorWithExternalLauncher", "methods": [ { "kind": "function", "name": "ExecutorWithExternalLauncher._init_executor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ExecutorWithExternalLauncher._distributed_args", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ExecutorWithExternalLauncher.determine_available_memory", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.executor.uniproc_executor", "names": [ "vllm.v1.executor.uniproc_executor.ExecutorWithExternalLauncher", "vllm.v1.executor.uniproc_executor.UniProcExecutor", "vllm.v1.executor.uniproc_executor.logger" ], "n_typable": 23, "n_typed": 21, "n_any": 1, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 10, "n_classes": 2, "n_attrs": 1, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/v1/executor/multiproc_executor.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.v1.executor.multiproc_executor.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.executor.multiproc_executor.WorkerProcHandle", "methods": [ { "kind": "function", "name": "WorkerProcHandle.from_unready_handle", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "WorkerProcHandle.proc", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "WorkerProcHandle.rank", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "WorkerProcHandle.worker_response_mq", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "WorkerProcHandle.peer_worker_response_mqs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "WorkerProcHandle.death_writer", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 3, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.executor.multiproc_executor.MultiprocExecutor", "methods": [ { "kind": "function", "name": "MultiprocExecutor.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MultiprocExecutor._init_executor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MultiprocExecutor._get_parallel_sizes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MultiprocExecutor._post_init_executor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MultiprocExecutor._is_driver_worker", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiprocExecutor.start_worker_monitor", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiprocExecutor.register_failure_callback", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiprocExecutor.execute_model", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MultiprocExecutor.sample_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MultiprocExecutor.execute_dummy_batch", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MultiprocExecutor.take_draft_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MultiprocExecutor.collective_rpc", "n_typed": 7, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "MultiprocExecutor._ensure_worker_termination", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiprocExecutor.shutdown", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MultiprocExecutor.check_health", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MultiprocExecutor._get_output_rank", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "MultiprocExecutor.max_concurrent_batches", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "MultiprocExecutor.supports_pp", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MultiprocExecutor.monitor_workers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 36, "n_typed": 29, "n_any": 1, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 16, "n_method_overloads": 16, "n_method_params": 17, "n_attrs": 2, "n_properties": 1 }, { "kind": "class", "name": "vllm.v1.executor.multiproc_executor.WorkerProc", "methods": [ { "kind": "function", "name": "WorkerProc._init_message_queues", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "WorkerProc.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "WorkerProc.make_worker_process", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "WorkerProc.wait_for_response_handle_ready", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "WorkerProc.wait_for_ready", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WorkerProc.shutdown", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "WorkerProc.worker_main", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "WorkerProc.enqueue_output", "n_typed": 0, "n_any": 1, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WorkerProc.handle_output", "n_typed": 0, "n_any": 1, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WorkerProc.async_output_busy_loop", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "WorkerProc.worker_busy_loop", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WorkerProc.setup_proc_title_and_log_prefix", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "WorkerProc.READY_STR", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "WorkerProc.rpc_broadcast_mq", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "WorkerProc.worker_response_mq", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "WorkerProc.rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WorkerProc.worker", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WorkerProc.use_async_scheduling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WorkerProc.async_output_queue", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "WorkerProc.async_output_copy_thread", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 44, "n_typed": 28, "n_any": 2, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 25, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.executor.multiproc_executor.ResponseStatus", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ResponseStatus.SUCCESS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ResponseStatus.FAILURE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.executor.multiproc_executor.UnreadyWorkerProcHandle", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "UnreadyWorkerProcHandle.proc", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "UnreadyWorkerProcHandle.rank", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "UnreadyWorkerProcHandle.ready_pipe", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "UnreadyWorkerProcHandle.death_writer", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.executor.multiproc_executor.set_multiprocessing_worker_envs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "class", "name": "vllm.v1.executor.multiproc_executor.FutureWrapper", "methods": [ { "kind": "function", "name": "FutureWrapper.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FutureWrapper.result", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FutureWrapper.wait_for_response", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FutureWrapper.futures_queue", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FutureWrapper.aggregate", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 9, "n_typed": 3, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.executor.multiproc_executor", "names": [ "vllm.v1.executor.multiproc_executor.FutureWrapper", "vllm.v1.executor.multiproc_executor.MultiprocExecutor", "vllm.v1.executor.multiproc_executor.ResponseStatus", "vllm.v1.executor.multiproc_executor.UnreadyWorkerProcHandle", "vllm.v1.executor.multiproc_executor.WorkerProc", "vllm.v1.executor.multiproc_executor.WorkerProcHandle", "vllm.v1.executor.multiproc_executor.logger", "vllm.v1.executor.multiproc_executor.set_multiprocessing_worker_envs" ], "n_typable": 95, "n_typed": 64, "n_any": 3, "n_untyped": 28, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 0, "n_methods": 32, "n_method_overloads": 32, "n_method_params": 49, "n_classes": 6, "n_attrs": 24, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/v1/executor/ray_executor.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.executor.ray_executor.RayWorkerMetaData", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "RayWorkerMetaData.worker", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RayWorkerMetaData.created_rank", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RayWorkerMetaData.adjusted_rank", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RayWorkerMetaData.ip", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.executor.ray_executor.COMPLETED_NONE_FUTURE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.executor.ray_executor.RayDistributedExecutor", "methods": [ { "kind": "function", "name": "RayDistributedExecutor._init_executor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RayDistributedExecutor.shutdown", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RayDistributedExecutor._configure_ray_workers_use_nsight", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RayDistributedExecutor._update_noset_device_env_vars", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RayDistributedExecutor._get_env_vars_to_be_updated", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RayDistributedExecutor._init_workers_ray", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "RayDistributedExecutor.reinitialize_distributed", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RayDistributedExecutor.execute_model", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "RayDistributedExecutor.sample_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "RayDistributedExecutor._execute_dag", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "RayDistributedExecutor.collective_rpc", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "RayDistributedExecutor._check_ray_cgraph_installation", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RayDistributedExecutor._compiled_ray_dag", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RayDistributedExecutor.__del__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RayDistributedExecutor.check_health", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "RayDistributedExecutor.max_concurrent_batches", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "RayDistributedExecutor.WORKER_SPECIFIC_ENV_VARS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RayDistributedExecutor.uses_ray", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "RayDistributedExecutor.supports_pp", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 36, "n_typed": 27, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 18, "n_attrs": 3, "n_properties": 1 }, { "kind": "attr", "name": "vllm.v1.executor.ray_executor.ActorHandle", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.v1.executor.ray_executor.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.v1.executor.ray_executor", "names": [ "vllm.v1.executor.ray_executor.ActorHandle", "vllm.v1.executor.ray_executor.COMPLETED_NONE_FUTURE", "vllm.v1.executor.ray_executor.RayDistributedExecutor", "vllm.v1.executor.ray_executor.RayWorkerMetaData", "vllm.v1.executor.ray_executor.logger" ], "n_typable": 38, "n_typed": 28, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 18, "n_classes": 2, "n_attrs": 10, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/v1/kv_cache_interface.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.v1.kv_cache_interface.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.kv_cache_interface.KVCacheConfig", "methods": [], "properties": [ { "kind": "property", "name": "KVCacheConfig.has_mamba_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "KVCacheConfig.needs_kv_cache_zeroing", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "KVCacheConfig.num_blocks", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "KVCacheConfig.kv_cache_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "KVCacheConfig.kv_cache_groups", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 2 }, { "kind": "class", "name": "vllm.v1.kv_cache_interface.AttentionSpec", "methods": [], "properties": [ { "kind": "property", "name": "AttentionSpec.page_size_bytes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "AttentionSpec.real_page_size_bytes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "AttentionSpec.num_kv_heads", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionSpec.head_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionSpec.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionSpec.page_size_padded", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 2 }, { "kind": "class", "name": "vllm.v1.kv_cache_interface.SlidingWindowSpec", "methods": [ { "kind": "function", "name": "SlidingWindowSpec.max_memory_usage_bytes", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SlidingWindowSpec.sliding_window", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.kv_cache_interface.FullAttentionSpec", "methods": [ { "kind": "function", "name": "FullAttentionSpec.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FullAttentionSpec.max_memory_usage_bytes", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FullAttentionSpec.merge_window_sizes", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FullAttentionSpec.merge", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "FullAttentionSpec.real_page_size_bytes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "FullAttentionSpec.head_size_v", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FullAttentionSpec.sliding_window", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FullAttentionSpec.attention_chunk_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 8, "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 3, "n_attrs": 3, "n_properties": 1 }, { "kind": "class", "name": "vllm.v1.kv_cache_interface.KVCacheTensor", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "KVCacheTensor.size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "KVCacheTensor.shared_by", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.kv_cache_interface.MambaSpec", "methods": [ { "kind": "function", "name": "MambaSpec.max_memory_usage_bytes", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "MambaSpec.page_size_bytes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "MambaSpec.shapes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MambaSpec.dtypes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MambaSpec.page_size_padded", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MambaSpec.mamba_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MambaSpec.mamba_cache_mode", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MambaSpec.num_speculative_blocks", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 6, "n_properties": 1 }, { "kind": "class", "name": "vllm.v1.kv_cache_interface.EncoderOnlyAttentionSpec", "methods": [ { "kind": "function", "name": "EncoderOnlyAttentionSpec.max_memory_usage_bytes", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.kv_cache_interface.MLAAttentionSpec", "methods": [ { "kind": "function", "name": "MLAAttentionSpec.merge", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "MLAAttentionSpec.real_page_size_bytes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "MLAAttentionSpec.cache_dtype_str", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 1, "n_properties": 1 }, { "kind": "class", "name": "vllm.v1.kv_cache_interface.KVCacheGroupSpec", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "KVCacheGroupSpec.layer_names", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "KVCacheGroupSpec.kv_cache_spec", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.kv_cache_interface.SinkFullAttentionSpec", "methods": [ { "kind": "function", "name": "SinkFullAttentionSpec.merge", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SinkFullAttentionSpec.sink_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.kv_cache_interface.KVCacheSpec", "methods": [ { "kind": "function", "name": "KVCacheSpec.max_memory_usage_bytes", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVCacheSpec.copy_with_new_block_size", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVCacheSpec.merge", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "KVCacheSpec.page_size_bytes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "KVCacheSpec.block_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_attrs": 1, "n_properties": 1 }, { "kind": "class", "name": "vllm.v1.kv_cache_interface.ChunkedLocalAttentionSpec", "methods": [ { "kind": "function", "name": "ChunkedLocalAttentionSpec.max_memory_usage_bytes", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ChunkedLocalAttentionSpec.attention_chunk_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.kv_cache_interface.CrossAttentionSpec", "methods": [ { "kind": "function", "name": "CrossAttentionSpec.max_memory_usage_bytes", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.kv_cache_interface.UniformTypeKVCacheSpecs", "methods": [ { "kind": "function", "name": "UniformTypeKVCacheSpecs.max_memory_usage_bytes", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "UniformTypeKVCacheSpecs.is_uniform_type", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "UniformTypeKVCacheSpecs.from_specs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "UniformTypeKVCacheSpecs.page_size_bytes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "UniformTypeKVCacheSpecs.kv_cache_specs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_attrs": 1, "n_properties": 1 } ], "type_ignores": [ { "kind": "type", "rules": [ "assignment" ] } ], "name": "vllm.v1.kv_cache_interface", "names": [ "vllm.v1.kv_cache_interface.AttentionSpec", "vllm.v1.kv_cache_interface.ChunkedLocalAttentionSpec", "vllm.v1.kv_cache_interface.CrossAttentionSpec", "vllm.v1.kv_cache_interface.EncoderOnlyAttentionSpec", "vllm.v1.kv_cache_interface.FullAttentionSpec", "vllm.v1.kv_cache_interface.KVCacheConfig", "vllm.v1.kv_cache_interface.KVCacheGroupSpec", "vllm.v1.kv_cache_interface.KVCacheSpec", "vllm.v1.kv_cache_interface.KVCacheTensor", "vllm.v1.kv_cache_interface.MLAAttentionSpec", "vllm.v1.kv_cache_interface.MambaSpec", "vllm.v1.kv_cache_interface.SinkFullAttentionSpec", "vllm.v1.kv_cache_interface.SlidingWindowSpec", "vllm.v1.kv_cache_interface.UniformTypeKVCacheSpecs", "vllm.v1.kv_cache_interface.logger" ], "n_typable": 43, "n_typed": 41, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 17, "n_method_overloads": 17, "n_method_params": 16, "n_classes": 14, "n_attrs": 27, "n_properties": 9, "n_type_ignores": 1 }, { "path": "vllm/v1/kv_offload/abstract.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.kv_offload.abstract.LoadStoreSpec", "methods": [ { "kind": "function", "name": "LoadStoreSpec.medium", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.kv_offload.abstract.PrepareStoreOutput", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "PrepareStoreOutput.block_hashes_to_store", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PrepareStoreOutput.store_spec", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PrepareStoreOutput.block_hashes_evicted", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.kv_offload.abstract.OffloadingManager", "methods": [ { "kind": "function", "name": "OffloadingManager.lookup", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OffloadingManager.prepare_load", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OffloadingManager.touch", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OffloadingManager.complete_load", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OffloadingManager.prepare_store", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OffloadingManager.complete_store", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OffloadingManager.take_events", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 14, "n_typed": 11, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 7, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.kv_offload.abstract.OffloadingEvent", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "OffloadingEvent.block_hashes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "OffloadingEvent.block_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "OffloadingEvent.medium", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "OffloadingEvent.removed", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.kv_offload.abstract", "names": [ "vllm.v1.kv_offload.abstract.LoadStoreSpec", "vllm.v1.kv_offload.abstract.OffloadingEvent", "vllm.v1.kv_offload.abstract.OffloadingManager", "vllm.v1.kv_offload.abstract.PrepareStoreOutput" ], "n_typable": 15, "n_typed": 12, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 7, "n_classes": 4, "n_attrs": 7, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/kv_offload/arc_manager.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.kv_offload.arc_manager.ARCOffloadingManager", "methods": [ { "kind": "function", "name": "ARCOffloadingManager.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ARCOffloadingManager.lookup", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ARCOffloadingManager.prepare_load", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ARCOffloadingManager.touch", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ARCOffloadingManager.complete_load", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ARCOffloadingManager.prepare_store", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ARCOffloadingManager.complete_store", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ARCOffloadingManager.take_events", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ARCOffloadingManager.backend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ARCOffloadingManager.target_t1_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ARCOffloadingManager.t1", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ARCOffloadingManager.t2", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ARCOffloadingManager.b1", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ARCOffloadingManager.b2", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ARCOffloadingManager.events", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ARCOffloadingManager.cache_capacity", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 25, "n_typed": 21, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 9, "n_attrs": 8, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.kv_offload.arc_manager", "names": [ "vllm.v1.kv_offload.arc_manager.ARCOffloadingManager" ], "n_typable": 25, "n_typed": 21, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 9, "n_classes": 1, "n_attrs": 8, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/kv_offload/backend.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.kv_offload.backend.BlockStatus", "methods": [ { "kind": "function", "name": "BlockStatus.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "BlockStatus.is_ready", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "BlockStatus._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BlockStatus.ref_cnt", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 3, "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 2, "n_properties": 1 }, { "kind": "class", "name": "vllm.v1.kv_offload.backend.Backend", "methods": [ { "kind": "function", "name": "Backend.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Backend.get_num_free_blocks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Backend.allocate_blocks", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Backend.free", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Backend.get_load_store_spec", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Backend.block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Backend.medium", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 8, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 6, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.kv_offload.backend", "names": [ "vllm.v1.kv_offload.backend.Backend", "vllm.v1.kv_offload.backend.BlockStatus" ], "n_typable": 16, "n_typed": 9, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 6, "n_classes": 2, "n_attrs": 4, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/v1/kv_offload/backends/cpu.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.kv_offload.backends.cpu.CPUBlockStatus", "methods": [ { "kind": "function", "name": "CPUBlockStatus.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CPUBlockStatus._fields_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CPUBlockStatus.block_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 3, "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.kv_offload.backends.cpu.CPUBackend", "methods": [ { "kind": "function", "name": "CPUBackend.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CPUBackend.get_num_free_blocks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CPUBackend.allocate_blocks", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CPUBackend.free", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CPUBackend.get_load_store_spec", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CPUBackend.num_blocks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CPUBackend.num_allocated_blocks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CPUBackend.allocated_blocks_free_list", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 14, "n_typed": 11, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 6, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [ { "kind": "type", "rules": null } ], "name": "vllm.v1.kv_offload.backends.cpu", "names": [ "vllm.v1.kv_offload.backends.cpu.CPUBackend", "vllm.v1.kv_offload.backends.cpu.CPUBlockStatus" ], "n_typable": 17, "n_typed": 12, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 7, "n_classes": 2, "n_attrs": 5, "n_properties": 0, "n_type_ignores": 1 }, { "path": "vllm/v1/kv_offload/cpu.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.kv_offload.cpu.CPUOffloadingSpec", "methods": [ { "kind": "function", "name": "CPUOffloadingSpec.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CPUOffloadingSpec.get_manager", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CPUOffloadingSpec.get_handlers", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CPUOffloadingSpec.num_blocks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CPUOffloadingSpec.eviction_policy", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 9, "n_typed": 7, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.kv_offload.cpu", "names": [ "vllm.v1.kv_offload.cpu.CPUOffloadingSpec" ], "n_typable": 9, "n_typed": 7, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_classes": 1, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/kv_offload/factory.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.kv_offload.factory.OffloadingSpecFactory", "methods": [ { "kind": "function", "name": "OffloadingSpecFactory.register_spec", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "OffloadingSpecFactory.create_spec", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OffloadingSpecFactory._registry", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 8, "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.kv_offload.factory.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.v1.kv_offload.factory", "names": [ "vllm.v1.kv_offload.factory.OffloadingSpecFactory", "vllm.v1.kv_offload.factory.logger" ], "n_typable": 9, "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_classes": 1, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/kv_offload/lru_manager.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.kv_offload.lru_manager.LRUOffloadingManager", "methods": [ { "kind": "function", "name": "LRUOffloadingManager.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LRUOffloadingManager.lookup", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LRUOffloadingManager.prepare_load", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LRUOffloadingManager.touch", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LRUOffloadingManager.complete_load", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LRUOffloadingManager.prepare_store", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LRUOffloadingManager.complete_store", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LRUOffloadingManager.take_events", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LRUOffloadingManager.backend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LRUOffloadingManager.blocks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LRUOffloadingManager.events", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 20, "n_typed": 16, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 9, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.kv_offload.lru_manager", "names": [ "vllm.v1.kv_offload.lru_manager.LRUOffloadingManager" ], "n_typable": 20, "n_typed": 16, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 9, "n_classes": 1, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/kv_offload/mediums.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.kv_offload.mediums.CPULoadStoreSpec", "methods": [ { "kind": "function", "name": "CPULoadStoreSpec.medium", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.kv_offload.mediums.BlockIDsLoadStoreSpec", "methods": [ { "kind": "function", "name": "BlockIDsLoadStoreSpec.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BlockIDsLoadStoreSpec.__repr__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BlockIDsLoadStoreSpec.block_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 4, "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.kv_offload.mediums.GPULoadStoreSpec", "methods": [ { "kind": "function", "name": "GPULoadStoreSpec.medium", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.kv_offload.mediums", "names": [ "vllm.v1.kv_offload.mediums.BlockIDsLoadStoreSpec", "vllm.v1.kv_offload.mediums.CPULoadStoreSpec", "vllm.v1.kv_offload.mediums.GPULoadStoreSpec" ], "n_typable": 6, "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 1, "n_classes": 3, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/kv_offload/spec.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.v1.kv_offload.spec.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.kv_offload.spec.OffloadingSpec", "methods": [ { "kind": "function", "name": "OffloadingSpec.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OffloadingSpec.get_manager", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "OffloadingSpec.get_handlers", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OffloadingSpec.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OffloadingSpec.kv_cache_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OffloadingSpec.extra_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OffloadingSpec.gpu_block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "OffloadingSpec.offloaded_block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 6, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_attrs": 5, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.kv_offload.spec", "names": [ "vllm.v1.kv_offload.spec.OffloadingSpec", "vllm.v1.kv_offload.spec.logger" ], "n_typable": 13, "n_typed": 6, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_classes": 1, "n_attrs": 6, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/kv_offload/worker/cpu_gpu.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.kv_offload.worker.cpu_gpu.Transfer", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Transfer.job_id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Transfer.stream", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Transfer.start_event", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Transfer.end_event", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Transfer.num_bytes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 5, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.kv_offload.worker.cpu_gpu.expand_block_ids", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.v1.kv_offload.worker.cpu_gpu.CpuGpuOffloadingHandlers", "methods": [ { "kind": "function", "name": "CpuGpuOffloadingHandlers.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CpuGpuOffloadingHandlers.gpu_to_cpu_handler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CpuGpuOffloadingHandlers.cpu_to_gpu_handler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 8, "n_typed": 5, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 5, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.kv_offload.worker.cpu_gpu.SingleDirectionOffloadingHandler", "methods": [ { "kind": "function", "name": "SingleDirectionOffloadingHandler.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "SingleDirectionOffloadingHandler.transfer_async", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SingleDirectionOffloadingHandler.get_finished", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SingleDirectionOffloadingHandler.wait", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SingleDirectionOffloadingHandler.src_tensors", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SingleDirectionOffloadingHandler.dst_tensors", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SingleDirectionOffloadingHandler.src_block_size_factor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SingleDirectionOffloadingHandler.dst_block_size_factor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SingleDirectionOffloadingHandler.block_size_in_bytes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SingleDirectionOffloadingHandler.total_block_size_in_bytes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SingleDirectionOffloadingHandler.gpu_to_cpu", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SingleDirectionOffloadingHandler.transfer_type", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 14, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 7, "n_attrs": 8, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.kv_offload.worker.cpu_gpu.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.v1.kv_offload.worker.cpu_gpu", "names": [ "vllm.v1.kv_offload.worker.cpu_gpu.CpuGpuOffloadingHandlers", "vllm.v1.kv_offload.worker.cpu_gpu.SingleDirectionOffloadingHandler", "vllm.v1.kv_offload.worker.cpu_gpu.Transfer", "vllm.v1.kv_offload.worker.cpu_gpu.expand_block_ids", "vllm.v1.kv_offload.worker.cpu_gpu.logger" ], "n_typable": 33, "n_typed": 23, "n_any": 0, "n_untyped": 10, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 4, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 12, "n_classes": 3, "n_attrs": 16, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/kv_offload/worker/worker.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.kv_offload.worker.worker.OffloadingWorker", "methods": [ { "kind": "function", "name": "OffloadingWorker.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "OffloadingWorker.register_handler", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "OffloadingWorker.transfer_async", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OffloadingWorker.get_finished", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "OffloadingWorker.wait", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OffloadingWorker.handlers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "OffloadingWorker.transfer_type_to_handler", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 13, "n_typed": 12, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 6, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.kv_offload.worker.worker.TransferType", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.v1.kv_offload.worker.worker.OffloadingHandler", "methods": [ { "kind": "function", "name": "OffloadingHandler.transfer_async", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OffloadingHandler.get_finished", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "OffloadingHandler.wait", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.kv_offload.worker.worker.TransferResult", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "TransferResult.job_id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TransferResult.success", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TransferResult.transfer_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TransferResult.transfer_time", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TransferResult.transfer_type", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 5, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.kv_offload.worker.worker.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.v1.kv_offload.worker.worker.TransferSpec", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.v1.kv_offload.worker.worker", "names": [ "vllm.v1.kv_offload.worker.worker.OffloadingHandler", "vllm.v1.kv_offload.worker.worker.OffloadingWorker", "vllm.v1.kv_offload.worker.worker.TransferResult", "vllm.v1.kv_offload.worker.worker.TransferSpec", "vllm.v1.kv_offload.worker.worker.TransferType", "vllm.v1.kv_offload.worker.worker.logger" ], "n_typable": 20, "n_typed": 18, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 9, "n_classes": 3, "n_attrs": 10, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/metrics/loggers.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.v1.metrics.loggers.AggregateStatLoggerFactory", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.v1.metrics.loggers.load_stat_logger_plugin_factories", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "class", "name": "vllm.v1.metrics.loggers.StatLoggerBase", "methods": [ { "kind": "function", "name": "StatLoggerBase.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StatLoggerBase.record", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "StatLoggerBase.log_engine_initialized", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "StatLoggerBase.log", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "StatLoggerBase.record_sleep_state", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 13, "n_typed": 8, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 8, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.metrics.loggers.PerEngineStatLoggerAdapter", "methods": [ { "kind": "function", "name": "PerEngineStatLoggerAdapter.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "PerEngineStatLoggerAdapter.record", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "PerEngineStatLoggerAdapter.log", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PerEngineStatLoggerAdapter.log_engine_initialized", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PerEngineStatLoggerAdapter.per_engine_stat_loggers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerEngineStatLoggerAdapter.engine_indexes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 8, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 7, "n_attrs": 2, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.metrics.loggers.make_per_engine", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.v1.metrics.loggers.build_1_2_5_buckets", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.v1.metrics.loggers.PrometheusStatLogger", "methods": [ { "kind": "function", "name": "PrometheusStatLogger.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PrometheusStatLogger.log_metrics_info", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PrometheusStatLogger.record", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "PrometheusStatLogger.record_sleep_state", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PrometheusStatLogger.log_engine_initialized", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PrometheusStatLogger._gauge_cls", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PrometheusStatLogger._counter_cls", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PrometheusStatLogger._histogram_cls", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PrometheusStatLogger._spec_decoding_cls", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PrometheusStatLogger._kv_connector_cls", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PrometheusStatLogger._perf_metrics_cls", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PrometheusStatLogger.engine_indexes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.show_hidden_metrics", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.kv_cache_metrics_enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.spec_decoding_prom", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.kv_connector_prom", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.perf_metrics_prom", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.gauge_scheduler_running", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.gauge_scheduler_waiting", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.gauge_engine_sleep_state", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.gauge_kv_cache_usage", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.counter_prefix_cache_queries", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.counter_prefix_cache_hits", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.counter_connector_prefix_cache_queries", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.counter_connector_prefix_cache_hits", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.counter_mm_cache_queries", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.counter_mm_cache_hits", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.counter_num_preempted_reqs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.counter_prompt_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.counter_prompt_tokens_by_source", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.counter_prompt_tokens_cached", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.counter_prompt_tokens_recomputed", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.counter_generation_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.counter_request_success", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.histogram_num_prompt_tokens_request", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.histogram_num_generation_tokens_request", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.histogram_iteration_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.histogram_max_num_generation_tokens_request", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.histogram_n_request", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.histogram_max_tokens_request", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.histogram_time_to_first_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.histogram_inter_token_latency", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.histogram_request_time_per_output_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.histogram_e2e_time_request", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.histogram_queue_time_request", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.histogram_inference_time_request", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.histogram_prefill_time_request", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.histogram_decode_time_request", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.histogram_prefill_kv_computed_request", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.gauge_lora_info", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.counter_corrupted_requests", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.histogram_kv_block_lifetime", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.histogram_kv_block_idle_before_evict", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.histogram_kv_block_reuse_gap", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.labelname_max_lora", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.labelname_waiting_lora_adapters", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.labelname_running_lora_adapters", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PrometheusStatLogger.max_lora", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 63, "n_typed": 13, "n_any": 0, "n_untyped": 50, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 10, "n_attrs": 54, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.metrics.loggers.PromMetric", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.v1.metrics.loggers.StatLoggerFactory", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.v1.metrics.loggers.AggregateStatLoggerBase", "methods": [ { "kind": "function", "name": "AggregateStatLoggerBase.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.metrics.loggers.PerEngineStatLoggerFactory", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.v1.metrics.loggers.build_buckets", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.v1.metrics.loggers.AggregatedLoggingStatLogger", "methods": [ { "kind": "function", "name": "AggregatedLoggingStatLogger.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AggregatedLoggingStatLogger._enable_perf_stats", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AggregatedLoggingStatLogger.record", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "AggregatedLoggingStatLogger.aggregate_scheduler_stats", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AggregatedLoggingStatLogger.log", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AggregatedLoggingStatLogger.log_engine_initialized", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "AggregatedLoggingStatLogger.log_prefix", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "AggregatedLoggingStatLogger.engine_indexes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AggregatedLoggingStatLogger.last_scheduler_stats_dict", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AggregatedLoggingStatLogger.aggregated", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 8, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 6, "n_attrs": 3, "n_properties": 1 }, { "kind": "attr", "name": "vllm.v1.metrics.loggers.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.metrics.loggers.StatLoggerManager", "methods": [ { "kind": "function", "name": "StatLoggerManager.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "StatLoggerManager.record", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "StatLoggerManager.record_sleep_state", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StatLoggerManager.log", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "StatLoggerManager.log_engine_initialized", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "StatLoggerManager.engine_indexes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StatLoggerManager.stat_loggers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 19, "n_typed": 13, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 12, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.metrics.loggers.LoggingStatLogger", "methods": [ { "kind": "function", "name": "LoggingStatLogger.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LoggingStatLogger._reset", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LoggingStatLogger._enable_perf_stats", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LoggingStatLogger._track_iteration_stats", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LoggingStatLogger._get_throughput", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LoggingStatLogger.record", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "LoggingStatLogger._update_stats", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LoggingStatLogger.aggregate_scheduler_stats", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LoggingStatLogger.log", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LoggingStatLogger.log_engine_initialized", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "LoggingStatLogger.log_prefix", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "LoggingStatLogger.engine_index", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoggingStatLogger.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoggingStatLogger.last_scheduler_stats", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoggingStatLogger.prefix_caching_metrics", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoggingStatLogger.connector_prefix_caching_metrics", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoggingStatLogger.mm_caching_metrics", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoggingStatLogger.spec_decoding_logging", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoggingStatLogger.kv_connector_logging", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoggingStatLogger.cudagraph_logging", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoggingStatLogger.last_prompt_throughput", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LoggingStatLogger.last_generation_throughput", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LoggingStatLogger.engine_is_idle", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoggingStatLogger.aggregated", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoggingStatLogger.perf_metrics_logging", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 35, "n_typed": 13, "n_any": 0, "n_untyped": 22, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 10, "n_attrs": 14, "n_properties": 1 } ], "type_ignores": [], "name": "vllm.v1.metrics.loggers", "names": [ "vllm.v1.metrics.loggers.AggregateStatLoggerBase", "vllm.v1.metrics.loggers.AggregateStatLoggerFactory", "vllm.v1.metrics.loggers.AggregatedLoggingStatLogger", "vllm.v1.metrics.loggers.LoggingStatLogger", "vllm.v1.metrics.loggers.PerEngineStatLoggerAdapter", "vllm.v1.metrics.loggers.PerEngineStatLoggerFactory", "vllm.v1.metrics.loggers.PromMetric", "vllm.v1.metrics.loggers.PrometheusStatLogger", "vllm.v1.metrics.loggers.StatLoggerBase", "vllm.v1.metrics.loggers.StatLoggerFactory", "vllm.v1.metrics.loggers.StatLoggerManager", "vllm.v1.metrics.loggers.build_1_2_5_buckets", "vllm.v1.metrics.loggers.build_buckets", "vllm.v1.metrics.loggers.load_stat_logger_plugin_factories", "vllm.v1.metrics.loggers.logger", "vllm.v1.metrics.loggers.make_per_engine" ], "n_typable": 175, "n_typed": 77, "n_any": 0, "n_untyped": 98, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 6, "n_methods": 36, "n_method_overloads": 36, "n_method_params": 55, "n_classes": 7, "n_attrs": 80, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/v1/metrics/perf.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.metrics.perf.FfnQuantizationConfigParser", "methods": [ { "kind": "function", "name": "FfnQuantizationConfigParser.parse", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.metrics.perf.Parser", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.metrics.perf.UnembedMetrics", "methods": [ { "kind": "function", "name": "UnembedMetrics.component_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "UnembedMetrics.get_parser", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "UnembedMetrics.get_num_flops_breakdown", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "UnembedMetrics.get_read_bytes_breakdown", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "UnembedMetrics.get_write_bytes_breakdown", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "UnembedMetrics.hidden_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "UnembedMetrics.vocab_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "UnembedMetrics.weight_byte_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "UnembedMetrics.activation_byte_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "UnembedMetrics.tp_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 16, "n_typed": 16, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 6, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.metrics.perf.PerfStats", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "PerfStats.num_flops_per_gpu", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PerfStats.num_read_bytes_per_gpu", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PerfStats.num_write_bytes_per_gpu", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PerfStats.debug_stats", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.metrics.perf.make_per_engine", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.v1.metrics.perf.PerfMetricsProm", "methods": [ { "kind": "function", "name": "PerfMetricsProm.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "PerfMetricsProm.observe", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PerfMetricsProm._counter_cls", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PerfMetricsProm.counter_flops", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerfMetricsProm.counter_read_bytes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerfMetricsProm.counter_write_bytes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 5, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.metrics.perf.AttentionMetrics", "methods": [ { "kind": "function", "name": "AttentionMetrics.component_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AttentionMetrics.get_parser", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AttentionMetrics.get_num_flops_breakdown", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AttentionMetrics.get_read_bytes_breakdown", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "AttentionMetrics.get_write_bytes_breakdown", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AttentionMetrics.num_hidden_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AttentionMetrics.hidden_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AttentionMetrics.num_attention_heads", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AttentionMetrics.activation_byte_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AttentionMetrics.tp_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AttentionMetrics.pp_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AttentionMetrics.num_key_value_heads", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AttentionMetrics.head_dim", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AttentionMetrics.cache_byte_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AttentionMetrics.weight_byte_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 21, "n_typed": 21, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 6, "n_attrs": 10, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.metrics.perf.FfnParallelParser", "methods": [ { "kind": "function", "name": "FfnParallelParser.parse", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.metrics.perf.BaseConfigParser", "methods": [ { "kind": "function", "name": "BaseConfigParser.parse", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.metrics.perf.MoeLayerFreqParser", "methods": [ { "kind": "function", "name": "MoeLayerFreqParser.parse", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.metrics.perf.PerfMetricsLogging", "methods": [ { "kind": "function", "name": "PerfMetricsLogging.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PerfMetricsLogging.reset", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PerfMetricsLogging.observe", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PerfMetricsLogging.log", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PerfMetricsLogging.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerfMetricsLogging.pp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PerfMetricsLogging.debug_logging", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 11, "n_typed": 6, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 4, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.metrics.perf.InvalidComponent", "methods": [], "properties": [], "attrs": [], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.metrics.perf.getattr_from_list", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.v1.metrics.perf.ModelMetrics", "methods": [ { "kind": "function", "name": "ModelMetrics.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ModelMetrics.is_enabled", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelMetrics.get_num_flops", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ModelMetrics.get_read_bytes", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ModelMetrics.get_write_bytes", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ModelMetrics.get_num_flops_breakdown", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ModelMetrics.get_read_bytes_breakdown", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ModelMetrics.get_write_bytes_breakdown", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ModelMetrics.get_step_perf_stats_per_gpu", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ModelMetrics.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ModelMetrics.metrics", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 25, "n_typed": 24, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 14, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.metrics.perf.InterleaveMoeLayerStepParser", "methods": [ { "kind": "function", "name": "InterleaveMoeLayerStepParser.parse", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.metrics.perf.BaseAttentionConfigParser", "methods": [ { "kind": "function", "name": "BaseAttentionConfigParser.parse", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.metrics.perf.ComponentMetrics", "methods": [ { "kind": "function", "name": "ComponentMetrics.component_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ComponentMetrics.get_parser", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ComponentMetrics.__init_subclass__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ComponentMetrics.from_vllm_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ComponentMetrics.registered_metrics", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ComponentMetrics.get_num_flops_breakdown", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ComponentMetrics.get_read_bytes_breakdown", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ComponentMetrics.get_write_bytes_breakdown", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ComponentMetrics.get_num_flops", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ComponentMetrics.get_read_bytes", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ComponentMetrics.get_write_bytes", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 24, "n_typed": 23, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 13, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.metrics.perf.DebugPerfStats", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "DebugPerfStats.calc_duration", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DebugPerfStats.num_prefill_requests", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DebugPerfStats.num_decode_requests", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DebugPerfStats.context_breakdown", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DebugPerfStats.num_flops_per_gpu_breakdown", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DebugPerfStats.num_read_bytes_per_gpu_breakdown", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DebugPerfStats.num_write_bytes_per_gpu_breakdown", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.metrics.perf.AttentionQuantizationConfigParser", "methods": [ { "kind": "function", "name": "AttentionQuantizationConfigParser.parse", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.metrics.perf.ExecutionContext", "methods": [ { "kind": "function", "name": "ExecutionContext.add", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ExecutionContext.total_num_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ExecutionContext.total_token_context_product", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ExecutionContext.num_logits_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ExecutionContext.from_single_request", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ExecutionContext.num_prefill_requests", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ExecutionContext.prefill_num_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ExecutionContext.prefill_context_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ExecutionContext.prefill_token_context_product", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ExecutionContext.num_decode_requests", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ExecutionContext.decode_num_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ExecutionContext.decode_context_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ExecutionContext.decode_token_context_product", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 11, "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 6, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.metrics.perf.ParsedArgs", "methods": [ { "kind": "function", "name": "ParsedArgs.__getattr__", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ParsedArgs.__setattr__", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ParsedArgs.model_dump", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 4, "n_any": 2, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.metrics.perf.BaseFfnConfigParser", "methods": [ { "kind": "function", "name": "BaseFfnConfigParser.parse", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.metrics.perf.ParserChain", "methods": [ { "kind": "function", "name": "ParserChain.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ParserChain.add_parser", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ParserChain.parse", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ParserChain.parsers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.metrics.perf.get_required", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.v1.metrics.perf.FfnMetrics", "methods": [ { "kind": "function", "name": "FfnMetrics.validate_moe_fields", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FfnMetrics.component_type", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FfnMetrics.get_parser", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FfnMetrics.get_num_flops_breakdown", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FfnMetrics.get_read_bytes_breakdown", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FfnMetrics.get_write_bytes_breakdown", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FfnMetrics.num_hidden_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FfnMetrics.hidden_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FfnMetrics.activation_byte_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FfnMetrics.pp_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FfnMetrics.ffn_tp_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FfnMetrics.ffn_ep_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FfnMetrics.intermediate_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FfnMetrics.num_experts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FfnMetrics.num_experts_per_tok", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FfnMetrics.moe_intermediate_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FfnMetrics.num_shared_experts", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FfnMetrics.num_moe_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FfnMetrics.weight_byte_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 25, "n_typed": 25, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 6, "n_attrs": 13, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.metrics.perf.PerfMetricsDebugLogging", "methods": [ { "kind": "function", "name": "PerfMetricsDebugLogging.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PerfMetricsDebugLogging.reset", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PerfMetricsDebugLogging.observe", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PerfMetricsDebugLogging.log", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 8, "n_typed": 4, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.metrics.perf.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.v1.metrics.perf", "names": [ "vllm.v1.metrics.perf.AttentionMetrics", "vllm.v1.metrics.perf.AttentionQuantizationConfigParser", "vllm.v1.metrics.perf.BaseAttentionConfigParser", "vllm.v1.metrics.perf.BaseConfigParser", "vllm.v1.metrics.perf.BaseFfnConfigParser", "vllm.v1.metrics.perf.ComponentMetrics", "vllm.v1.metrics.perf.DebugPerfStats", "vllm.v1.metrics.perf.ExecutionContext", "vllm.v1.metrics.perf.FfnMetrics", "vllm.v1.metrics.perf.FfnParallelParser", "vllm.v1.metrics.perf.FfnQuantizationConfigParser", "vllm.v1.metrics.perf.InterleaveMoeLayerStepParser", "vllm.v1.metrics.perf.InvalidComponent", "vllm.v1.metrics.perf.ModelMetrics", "vllm.v1.metrics.perf.MoeLayerFreqParser", "vllm.v1.metrics.perf.ParsedArgs", "vllm.v1.metrics.perf.Parser", "vllm.v1.metrics.perf.ParserChain", "vllm.v1.metrics.perf.PerfMetricsDebugLogging", "vllm.v1.metrics.perf.PerfMetricsLogging", "vllm.v1.metrics.perf.PerfMetricsProm", "vllm.v1.metrics.perf.PerfStats", "vllm.v1.metrics.perf.UnembedMetrics", "vllm.v1.metrics.perf.get_required", "vllm.v1.metrics.perf.getattr_from_list", "vllm.v1.metrics.perf.logger", "vllm.v1.metrics.perf.make_per_engine" ], "n_typable": 199, "n_typed": 176, "n_any": 2, "n_untyped": 21, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 7, "n_methods": 65, "n_method_overloads": 65, "n_method_params": 86, "n_classes": 23, "n_attrs": 58, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/metrics/prometheus.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.metrics.prometheus.unregister_vllm_metrics", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.v1.metrics.prometheus.get_prometheus_registry", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.v1.metrics.prometheus.shutdown_prometheus", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.v1.metrics.prometheus.setup_multiprocess_prometheus", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.v1.metrics.prometheus.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.v1.metrics.prometheus", "names": [ "vllm.v1.metrics.prometheus.get_prometheus_registry", "vllm.v1.metrics.prometheus.logger", "vllm.v1.metrics.prometheus.setup_multiprocess_prometheus", "vllm.v1.metrics.prometheus.shutdown_prometheus", "vllm.v1.metrics.prometheus.unregister_vllm_metrics" ], "n_typable": 5, "n_typed": 1, "n_any": 0, "n_untyped": 4, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/metrics/ray_wrappers.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.metrics.ray_wrappers.RayPrometheusMetric", "methods": [ { "kind": "function", "name": "RayPrometheusMetric.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RayPrometheusMetric._get_tag_keys", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RayPrometheusMetric.labels", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "RayPrometheusMetric._get_sanitized_opentelemetry_name", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RayPrometheusMetric.metric", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 9, "n_typed": 5, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 4, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.metrics.ray_wrappers.ray_metrics", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.v1.metrics.ray_wrappers.RayCounterWrapper", "methods": [ { "kind": "function", "name": "RayCounterWrapper.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "RayCounterWrapper.inc", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.metrics.ray_wrappers.RayPerfMetricsProm", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "RayPerfMetricsProm._counter_cls", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.metrics.ray_wrappers.RayGaugeWrapper", "methods": [ { "kind": "function", "name": "RayGaugeWrapper.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "RayGaugeWrapper.set", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RayGaugeWrapper.set_to_current_time", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 8, "n_typed": 5, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.metrics.ray_wrappers.RayHistogramWrapper", "methods": [ { "kind": "function", "name": "RayHistogramWrapper.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "RayHistogramWrapper.observe", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.metrics.ray_wrappers.RayPrometheusStatLogger", "methods": [ { "kind": "function", "name": "RayPrometheusStatLogger._unregister_vllm_metrics", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RayPrometheusStatLogger._gauge_cls", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RayPrometheusStatLogger._counter_cls", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RayPrometheusStatLogger._histogram_cls", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RayPrometheusStatLogger._spec_decoding_cls", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RayPrometheusStatLogger._kv_connector_cls", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RayPrometheusStatLogger._perf_metrics_cls", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.metrics.ray_wrappers.RayKVConnectorPrometheus", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "RayKVConnectorPrometheus._gauge_cls", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RayKVConnectorPrometheus._counter_cls", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RayKVConnectorPrometheus._histogram_cls", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.metrics.ray_wrappers.RaySpecDecodingProm", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "RaySpecDecodingProm._counter_cls", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.metrics.ray_wrappers.ray_serve", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.v1.metrics.ray_wrappers", "names": [ "vllm.v1.metrics.ray_wrappers.RayCounterWrapper", "vllm.v1.metrics.ray_wrappers.RayGaugeWrapper", "vllm.v1.metrics.ray_wrappers.RayHistogramWrapper", "vllm.v1.metrics.ray_wrappers.RayKVConnectorPrometheus", "vllm.v1.metrics.ray_wrappers.RayPerfMetricsProm", "vllm.v1.metrics.ray_wrappers.RayPrometheusMetric", "vllm.v1.metrics.ray_wrappers.RayPrometheusStatLogger", "vllm.v1.metrics.ray_wrappers.RaySpecDecodingProm", "vllm.v1.metrics.ray_wrappers.ray_metrics", "vllm.v1.metrics.ray_wrappers.ray_serve" ], "n_typable": 31, "n_typed": 19, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 18, "n_classes": 8, "n_attrs": 14, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/metrics/reader.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.metrics.reader.Histogram", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Histogram.count", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Histogram.sum", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Histogram.buckets", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.metrics.reader.Counter", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Counter.value", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.metrics.reader.get_metrics_snapshot", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "class", "name": "vllm.v1.metrics.reader.Gauge", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Gauge.value", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.metrics.reader.Vector", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Vector.values", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.metrics.reader.Metric", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Metric.name", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Metric.labels", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.metrics.reader", "names": [ "vllm.v1.metrics.reader.Counter", "vllm.v1.metrics.reader.Gauge", "vllm.v1.metrics.reader.Histogram", "vllm.v1.metrics.reader.Metric", "vllm.v1.metrics.reader.Vector", "vllm.v1.metrics.reader.get_metrics_snapshot" ], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 5, "n_attrs": 8, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/metrics/stats.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.metrics.stats.KVCacheEvictionEvent", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "KVCacheEvictionEvent.lifetime_seconds", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "KVCacheEvictionEvent.idle_seconds", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "KVCacheEvictionEvent.reuse_gaps_seconds", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.metrics.stats.IterationStats", "methods": [ { "kind": "function", "name": "IterationStats.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "IterationStats.__repr__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "IterationStats._time_since", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "IterationStats.update_from_output", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "IterationStats.update_from_events", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "IterationStats.update_from_finished_request", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [ { "kind": "property", "name": "IterationStats.num_prompt_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "IterationStats.iteration_timestamp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "IterationStats.num_generation_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "IterationStats.prompt_token_stats", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "IterationStats.num_preempted_reqs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "IterationStats.finished_requests", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "IterationStats.max_num_generation_tokens_iter", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "IterationStats.n_params_iter", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "IterationStats.time_to_first_tokens_iter", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "IterationStats.inter_token_latencies_iter", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "IterationStats.num_corrupted_reqs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 36, "n_typed": 28, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 19, "n_attrs": 10, "n_properties": 1 }, { "kind": "class", "name": "vllm.v1.metrics.stats.MultiModalCacheStats", "methods": [ { "kind": "function", "name": "MultiModalCacheStats.record", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.metrics.stats.FinishedRequestStats", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "FinishedRequestStats.finish_reason", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FinishedRequestStats.e2e_latency", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FinishedRequestStats.num_prompt_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FinishedRequestStats.num_generation_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FinishedRequestStats.max_tokens_param", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FinishedRequestStats.queued_time", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FinishedRequestStats.prefill_time", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FinishedRequestStats.inference_time", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FinishedRequestStats.decode_time", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FinishedRequestStats.mean_time_per_output_token", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FinishedRequestStats.is_corrupted", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FinishedRequestStats.num_cached_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 12, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.metrics.stats.PromptTokenStats", "methods": [ { "kind": "function", "name": "PromptTokenStats.update_from_output", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "PromptTokenStats.get_by_source", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PromptTokenStats.ALL_SOURCES", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PromptTokenStats.computed", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PromptTokenStats.local_cache_hit", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PromptTokenStats.external_kv_transfer", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PromptTokenStats.cached_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PromptTokenStats.recomputed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PromptTokenStats.total", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 6, "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.metrics.stats.LoRARequestStates", "methods": [ { "kind": "function", "name": "LoRARequestStates.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LoRARequestStates._request_update", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "LoRARequestStates.request_waiting", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LoRARequestStates.request_running", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LoRARequestStates.request_finished", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LoRARequestStates.update_scheduler_stats", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LoRARequestStates.log_stats", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoRARequestStates.requests", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 20, "n_typed": 13, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 12, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.metrics.stats.BaseCacheStats", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "BaseCacheStats.reset", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BaseCacheStats.requests", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BaseCacheStats.queries", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BaseCacheStats.hits", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.metrics.stats.CachingMetrics", "methods": [ { "kind": "function", "name": "CachingMetrics.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CachingMetrics.observe", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CachingMetrics.reset", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "CachingMetrics.empty", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "CachingMetrics.hit_rate", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "CachingMetrics.max_recent_requests", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CachingMetrics.aggregated_requests", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CachingMetrics.aggregated_query_total", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CachingMetrics.aggregated_query_hit", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CachingMetrics.query_queue", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 5, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 2, "n_attrs": 5, "n_properties": 2 }, { "kind": "class", "name": "vllm.v1.metrics.stats.PrefixCacheStats", "methods": [ { "kind": "function", "name": "PrefixCacheStats.record", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PrefixCacheStats.preempted_requests", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PrefixCacheStats.preempted_queries", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PrefixCacheStats.preempted_hits", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 3, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.metrics.stats.SchedulerStats", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "SchedulerStats.num_running_reqs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SchedulerStats.num_waiting_reqs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SchedulerStats.step_counter", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SchedulerStats.current_wave", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SchedulerStats.kv_cache_usage", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SchedulerStats.encoder_cache_usage", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SchedulerStats.prefix_cache_stats", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SchedulerStats.connector_prefix_cache_stats", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SchedulerStats.kv_cache_eviction_events", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SchedulerStats.spec_decoding_stats", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SchedulerStats.kv_connector_stats", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SchedulerStats.waiting_lora_adapters", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SchedulerStats.running_lora_adapters", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SchedulerStats.cudagraph_stats", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SchedulerStats.perf_stats", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 15, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.metrics.stats.RequestStateStats", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "RequestStateStats.num_generation_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RequestStateStats.arrival_time", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RequestStateStats.queued_ts", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RequestStateStats.scheduled_ts", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RequestStateStats.first_token_ts", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RequestStateStats.last_token_ts", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RequestStateStats.first_token_latency", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RequestStateStats.is_corrupted", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.metrics.stats.LoRAStats", "methods": [ { "kind": "function", "name": "LoRAStats.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LoRAStats.update", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [ { "kind": "property", "name": "LoRAStats.empty", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "LoRAStats.waiting", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LoRAStats.running", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 8, "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 2, "n_properties": 1 } ], "type_ignores": [], "name": "vllm.v1.metrics.stats", "names": [ "vllm.v1.metrics.stats.BaseCacheStats", "vllm.v1.metrics.stats.CachingMetrics", "vllm.v1.metrics.stats.FinishedRequestStats", "vllm.v1.metrics.stats.IterationStats", "vllm.v1.metrics.stats.KVCacheEvictionEvent", "vllm.v1.metrics.stats.LoRARequestStates", "vllm.v1.metrics.stats.LoRAStats", "vllm.v1.metrics.stats.MultiModalCacheStats", "vllm.v1.metrics.stats.PrefixCacheStats", "vllm.v1.metrics.stats.PromptTokenStats", "vllm.v1.metrics.stats.RequestStateStats", "vllm.v1.metrics.stats.SchedulerStats" ], "n_typable": 89, "n_typed": 65, "n_any": 0, "n_untyped": 24, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 21, "n_method_overloads": 21, "n_method_params": 45, "n_classes": 12, "n_attrs": 71, "n_properties": 4, "n_type_ignores": 0 }, { "path": "vllm/v1/outputs.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.outputs.ModelRunnerOutput", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ModelRunnerOutput.req_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ModelRunnerOutput.req_id_to_index", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ModelRunnerOutput.sampled_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ModelRunnerOutput.logprobs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ModelRunnerOutput.prompt_logprobs_dict", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ModelRunnerOutput.pooler_output", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ModelRunnerOutput.kv_connector_output", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ModelRunnerOutput.ec_connector_output", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ModelRunnerOutput.num_nans_in_logits", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ModelRunnerOutput.cudagraph_stats", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 10, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.outputs.SamplerOutput", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "SamplerOutput.sampled_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SamplerOutput.logprobs_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.outputs.DraftTokenIds", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "DraftTokenIds.req_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "DraftTokenIds.draft_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.outputs.KVConnectorStats", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.v1.outputs.T", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.v1.outputs.EMPTY_MODEL_RUNNER_OUTPUT", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.outputs.LogprobsTensors", "methods": [ { "kind": "function", "name": "LogprobsTensors.tolists", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LogprobsTensors.to_cpu_nonblocking", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LogprobsTensors.filter", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LogprobsTensors.empty_cpu", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LogprobsTensors.logprob_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LogprobsTensors.logprobs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LogprobsTensors.selected_token_ranks", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LogprobsTensors.cu_num_generated_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 8, "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 4, "n_attrs": 4, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.outputs.make_empty_encoder_model_runner_output", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.v1.outputs.LogprobsLists", "methods": [ { "kind": "function", "name": "LogprobsLists.slice_request", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LogprobsLists.logprob_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LogprobsLists.logprobs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LogprobsLists.sampled_token_ranks", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LogprobsLists.cu_num_generated_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.outputs.AsyncModelRunnerOutput", "methods": [ { "kind": "function", "name": "AsyncModelRunnerOutput.get_output", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.outputs.KVConnectorKVEvents", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.v1.outputs.KVConnectorOutput", "methods": [ { "kind": "function", "name": "KVConnectorOutput.is_empty", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KVConnectorOutput.merge", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "KVConnectorOutput.finished_sending", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "KVConnectorOutput.finished_recving", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "KVConnectorOutput.kv_connector_stats", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "KVConnectorOutput.kv_cache_events", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "KVConnectorOutput.invalid_block_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "KVConnectorOutput.expected_finished_count", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 3, "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.outputs.ECConnectorOutput", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ECConnectorOutput.finished_sending", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ECConnectorOutput.finished_recving", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.outputs.PoolerOutput", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.v1.outputs", "names": [ "vllm.v1.outputs.AsyncModelRunnerOutput", "vllm.v1.outputs.DraftTokenIds", "vllm.v1.outputs.ECConnectorOutput", "vllm.v1.outputs.EMPTY_MODEL_RUNNER_OUTPUT", "vllm.v1.outputs.KVConnectorKVEvents", "vllm.v1.outputs.KVConnectorOutput", "vllm.v1.outputs.KVConnectorStats", "vllm.v1.outputs.LogprobsLists", "vllm.v1.outputs.LogprobsTensors", "vllm.v1.outputs.ModelRunnerOutput", "vllm.v1.outputs.PoolerOutput", "vllm.v1.outputs.SamplerOutput", "vllm.v1.outputs.T", "vllm.v1.outputs.make_empty_encoder_model_runner_output" ], "n_typable": 19, "n_typed": 14, "n_any": 0, "n_untyped": 5, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 7, "n_classes": 8, "n_attrs": 35, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/pool/metadata.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.pool.metadata.PoolingCursor", "methods": [ { "kind": "function", "name": "PoolingCursor.__getitem__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PoolingCursor.is_partial_prefill", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PoolingCursor.is_finished", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PoolingCursor.index", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PoolingCursor.first_token_indices_gpu", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PoolingCursor.last_token_indices_gpu", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PoolingCursor.prompt_lens_cpu", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PoolingCursor.seq_lens_cpu", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PoolingCursor.num_scheduled_tokens_cpu", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 4, "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 1, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.pool.metadata.PoolingMetadata", "methods": [ { "kind": "function", "name": "PoolingMetadata.__post_init__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PoolingMetadata.__getitem__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PoolingMetadata.get_prompt_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PoolingMetadata.get_pooling_cursor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PoolingMetadata.build_pooling_cursor", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PoolingMetadata.prompt_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PoolingMetadata.prompt_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PoolingMetadata.pooling_params", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PoolingMetadata.pooling_states", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PoolingMetadata.pooling_cursor", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 9, "n_typed": 7, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 4, "n_attrs": 5, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.pool.metadata.pin_memory", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.pool.metadata.PoolingStates", "methods": [ { "kind": "function", "name": "PoolingStates.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PoolingStates.clean", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PoolingStates.hidden_states_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 3, "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.pool.metadata", "names": [ "vllm.v1.pool.metadata.PoolingCursor", "vllm.v1.pool.metadata.PoolingMetadata", "vllm.v1.pool.metadata.PoolingStates", "vllm.v1.pool.metadata.pin_memory" ], "n_typable": 17, "n_typed": 9, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 5, "n_classes": 3, "n_attrs": 13, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/request.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.request.StreamingUpdate", "methods": [ { "kind": "function", "name": "StreamingUpdate.from_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "StreamingUpdate.mm_features", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StreamingUpdate.prompt_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StreamingUpdate.max_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StreamingUpdate.arrival_time", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StreamingUpdate.sampling_params", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.request.Request", "methods": [ { "kind": "function", "name": "Request.__init__", "n_typed": 16, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 }, { "kind": "function", "name": "Request.from_engine_core_request", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Request.append_output_token_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Request.update_block_hashes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Request.get_skip_reading_prefix_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Request.is_finished", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Request.get_finished_reason", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Request.get_num_encoder_embeds", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Request.record_event", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Request.take_events", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Request.__lt__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "Request.eos_token_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Request.use_structured_output", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Request.num_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Request.num_tokens_with_spec", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Request.num_output_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Request.num_encoder_inputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "Request.has_encoder_inputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "Request.request_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Request.client_index", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Request.priority", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Request.sampling_params", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Request.pooling_params", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Request.lora_request", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Request.structured_output_request", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Request.arrival_time", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Request.status", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Request.events", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Request.stop_reason", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Request.kv_transfer_params", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Request.prompt_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Request.prompt_embeds", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Request.num_prompt_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Request.num_output_placeholders", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Request.discard_latest_async_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Request.spec_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Request.num_computed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Request.cache_salt", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Request.mm_features", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Request.output_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Request.all_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Request.trace_headers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Request.num_cached_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Request.is_prefill_chunk", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Request.num_nans_in_logits", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Request.num_preemptions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Request.num_external_computed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Request.block_hashes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Request.skip_reading_prefix_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Request.resumable", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Request.streaming_queue", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Request.max_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 74, "n_typed": 47, "n_any": 0, "n_untyped": 27, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 22, "n_attrs": 34, "n_properties": 7 }, { "kind": "class", "name": "vllm.v1.request.RequestStatus", "methods": [ { "kind": "function", "name": "RequestStatus.__str__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RequestStatus.is_finished", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RequestStatus.get_finished_reason", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RequestStatus.WAITING", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RequestStatus.WAITING_FOR_FSM", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RequestStatus.WAITING_FOR_REMOTE_KVS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RequestStatus.WAITING_FOR_STREAMING_REQ", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RequestStatus.RUNNING", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RequestStatus.PREEMPTED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RequestStatus.FINISHED_STOPPED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RequestStatus.FINISHED_LENGTH_CAPPED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RequestStatus.FINISHED_ABORTED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RequestStatus.FINISHED_IGNORED", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RequestStatus.FINISHED_ERROR", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "RequestStatus.FINISHED_REPETITION", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 2, "n_attrs": 12, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.request", "names": [ "vllm.v1.request.Request", "vllm.v1.request.RequestStatus", "vllm.v1.request.StreamingUpdate" ], "n_typable": 81, "n_typed": 54, "n_any": 0, "n_untyped": 27, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 25, "n_classes": 3, "n_attrs": 51, "n_properties": 7, "n_type_ignores": 0 }, { "path": "vllm/v1/sample/logits_processor/__init__.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.v1.sample.logits_processor.STR_POOLING_REJECTS_LOGITSPROCS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.v1.sample.logits_processor.build_logitsprocs", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "class", "name": "vllm.v1.sample.logits_processor.AdapterLogitsProcessor", "methods": [ { "kind": "function", "name": "AdapterLogitsProcessor.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "AdapterLogitsProcessor.new_req_logits_processor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AdapterLogitsProcessor._new_state", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "AdapterLogitsProcessor.update_state", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "AdapterLogitsProcessor.apply", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AdapterLogitsProcessor.req_info", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 15, "n_typed": 13, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.sample.logits_processor.LOGITSPROCS_GROUP", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.v1.sample.logits_processor", "names": [ "vllm.v1.sample.logits_processor.AdapterLogitsProcessor", "vllm.v1.sample.logits_processor.LOGITSPROCS_GROUP", "vllm.v1.sample.logits_processor.STR_POOLING_REJECTS_LOGITSPROCS", "vllm.v1.sample.logits_processor.build_logitsprocs" ], "n_typable": 21, "n_typed": 19, "n_any": 0, "n_untyped": 2, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 5, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 9, "n_classes": 1, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/sample/logits_processor/builtin.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.sample.logits_processor.builtin.MinPLogitsProcessor", "methods": [ { "kind": "function", "name": "MinPLogitsProcessor.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MinPLogitsProcessor.is_argmax_invariant", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MinPLogitsProcessor.get_min_p_by_index", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MinPLogitsProcessor.update_state", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MinPLogitsProcessor.apply", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MinPLogitsProcessor.min_p_count", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MinPLogitsProcessor.min_p_cpu_tensor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MinPLogitsProcessor.min_p_cpu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MinPLogitsProcessor.use_double_tensor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MinPLogitsProcessor.min_p", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MinPLogitsProcessor.min_p_device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 17, "n_typed": 12, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 6, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.sample.logits_processor.builtin.MinTokensLogitsProcessor", "methods": [ { "kind": "function", "name": "MinTokensLogitsProcessor.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MinTokensLogitsProcessor.is_argmax_invariant", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MinTokensLogitsProcessor.add_request", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MinTokensLogitsProcessor.update_state", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MinTokensLogitsProcessor._device_tensor", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MinTokensLogitsProcessor.apply", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MinTokensLogitsProcessor.apply_with_spec_decode", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MinTokensLogitsProcessor.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MinTokensLogitsProcessor.pin_memory", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MinTokensLogitsProcessor.min_toks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MinTokensLogitsProcessor.logits_slice", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MinTokensLogitsProcessor.neg_inf_tensor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 24, "n_typed": 19, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 12, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.sample.logits_processor.builtin.LogitBiasLogitsProcessor", "methods": [ { "kind": "function", "name": "LogitBiasLogitsProcessor.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LogitBiasLogitsProcessor.is_argmax_invariant", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LogitBiasLogitsProcessor.update_state", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LogitBiasLogitsProcessor._device_tensor", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LogitBiasLogitsProcessor.apply", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LogitBiasLogitsProcessor.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LogitBiasLogitsProcessor.pin_memory", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LogitBiasLogitsProcessor.biases", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LogitBiasLogitsProcessor.bias_tensor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LogitBiasLogitsProcessor.logits_slice", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 11, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 7, "n_attrs": 5, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.sample.logits_processor.builtin.process_dict_updates", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.v1.sample.logits_processor.builtin.T", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.v1.sample.logits_processor.builtin", "names": [ "vllm.v1.sample.logits_processor.builtin.LogitBiasLogitsProcessor", "vllm.v1.sample.logits_processor.builtin.MinPLogitsProcessor", "vllm.v1.sample.logits_processor.builtin.MinTokensLogitsProcessor", "vllm.v1.sample.logits_processor.builtin.T", "vllm.v1.sample.logits_processor.builtin.process_dict_updates" ], "n_typable": 62, "n_typed": 46, "n_any": 0, "n_untyped": 16, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 3, "n_methods": 17, "n_method_overloads": 17, "n_method_params": 25, "n_classes": 3, "n_attrs": 17, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/sample/logits_processor/interface.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.sample.logits_processor.interface.LogitsProcessor", "methods": [ { "kind": "function", "name": "LogitsProcessor.validate_params", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LogitsProcessor.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LogitsProcessor.apply", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LogitsProcessor.is_argmax_invariant", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LogitsProcessor.update_state", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 11, "n_typed": 10, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 6, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.sample.logits_processor.interface.BatchUpdate", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "BatchUpdate.batch_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BatchUpdate.removed", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BatchUpdate.added", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BatchUpdate.moved", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.sample.logits_processor.interface.MoveDirectionality", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "MoveDirectionality.UNIDIRECTIONAL", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MoveDirectionality.SWAP", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.sample.logits_processor.interface.RemovedRequest", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.v1.sample.logits_processor.interface.MovedRequest", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.v1.sample.logits_processor.interface.AddedRequest", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.v1.sample.logits_processor.interface", "names": [ "vllm.v1.sample.logits_processor.interface.AddedRequest", "vllm.v1.sample.logits_processor.interface.BatchUpdate", "vllm.v1.sample.logits_processor.interface.LogitsProcessor", "vllm.v1.sample.logits_processor.interface.MoveDirectionality", "vllm.v1.sample.logits_processor.interface.MovedRequest", "vllm.v1.sample.logits_processor.interface.RemovedRequest" ], "n_typable": 11, "n_typed": 10, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 6, "n_classes": 3, "n_attrs": 9, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/sample/logits_processor/state.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.sample.logits_processor.state.BatchUpdateBuilder", "methods": [ { "kind": "function", "name": "BatchUpdateBuilder.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BatchUpdateBuilder._ensure_removed_sorted", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BatchUpdateBuilder.removed_append", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BatchUpdateBuilder.has_removed", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BatchUpdateBuilder.peek_removed", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BatchUpdateBuilder.pop_removed", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BatchUpdateBuilder.reset", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BatchUpdateBuilder.get_and_reset", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "BatchUpdateBuilder.removed", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "BatchUpdateBuilder._removed", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BatchUpdateBuilder._is_removed_sorted", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BatchUpdateBuilder.added", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BatchUpdateBuilder.moved", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BatchUpdateBuilder.batch_changed", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 19, "n_typed": 18, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 5, "n_attrs": 5, "n_properties": 1 }, { "kind": "class", "name": "vllm.v1.sample.logits_processor.state.LogitsProcessors", "methods": [ { "kind": "function", "name": "LogitsProcessors.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "LogitsProcessors.all", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "LogitsProcessors.argmax_invariant", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "LogitsProcessors.non_argmax_invariant", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 2, "n_properties": 1 } ], "type_ignores": [], "name": "vllm.v1.sample.logits_processor.state", "names": [ "vllm.v1.sample.logits_processor.state.BatchUpdateBuilder", "vllm.v1.sample.logits_processor.state.LogitsProcessors" ], "n_typable": 24, "n_typed": 23, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 6, "n_classes": 2, "n_attrs": 7, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/v1/sample/metadata.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.sample.metadata.SamplingMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "SamplingMetadata.temperature", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SamplingMetadata.all_greedy", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SamplingMetadata.all_random", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SamplingMetadata.top_p", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SamplingMetadata.top_k", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SamplingMetadata.generators", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SamplingMetadata.max_num_logprobs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SamplingMetadata.no_penalties", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SamplingMetadata.prompt_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SamplingMetadata.frequency_penalties", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SamplingMetadata.presence_penalties", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SamplingMetadata.repetition_penalties", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SamplingMetadata.output_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SamplingMetadata.allowed_token_ids_mask", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SamplingMetadata.bad_words_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SamplingMetadata.logitsprocs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SamplingMetadata.spec_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 17, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.sample.metadata", "names": [ "vllm.v1.sample.metadata.SamplingMetadata" ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 1, "n_attrs": 17, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/sample/ops/bad_words.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.sample.ops.bad_words.apply_bad_words_with_drafts", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.v1.sample.ops.bad_words.apply_bad_words", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [], "name": "vllm.v1.sample.ops.bad_words", "names": [ "vllm.v1.sample.ops.bad_words.apply_bad_words", "vllm.v1.sample.ops.bad_words.apply_bad_words_with_drafts" ], "n_typable": 9, "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 7, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/sample/ops/logprobs.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.sample.ops.logprobs.batched_count_greater_than", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.v1.sample.ops.logprobs", "names": [ "vllm.v1.sample.ops.logprobs.batched_count_greater_than" ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/sample/ops/penalties.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.sample.ops.penalties.apply_all_penalties", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "type_ignores": [], "name": "vllm.v1.sample.ops.penalties", "names": [ "vllm.v1.sample.ops.penalties.apply_all_penalties" ], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 6, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/sample/ops/topk_topp_sampler.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.sample.ops.topk_topp_sampler.random_sample", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.v1.sample.ops.topk_topp_sampler.TopKTopPSampler", "methods": [ { "kind": "function", "name": "TopKTopPSampler.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "TopKTopPSampler.forward_native", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "TopKTopPSampler.forward_cuda", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "TopKTopPSampler.forward_cpu", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "TopKTopPSampler.forward_hip", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "TopKTopPSampler.aiter_sample", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "TopKTopPSampler.logprobs_mode", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TopKTopPSampler.forward", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "TopKTopPSampler.aiter_ops", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 30, "n_typed": 27, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 21, "n_attrs": 3, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.sample.ops.topk_topp_sampler.compiled_random_sample", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.v1.sample.ops.topk_topp_sampler.apply_top_k_top_p", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.v1.sample.ops.topk_topp_sampler.apply_top_k_top_p_pytorch", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.v1.sample.ops.topk_topp_sampler.flashinfer_sample", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "attr", "name": "vllm.v1.sample.ops.topk_topp_sampler.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.v1.sample.ops.topk_topp_sampler.apply_top_k_only", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.v1.sample.ops.topk_topp_sampler", "names": [ "vllm.v1.sample.ops.topk_topp_sampler.TopKTopPSampler", "vllm.v1.sample.ops.topk_topp_sampler.apply_top_k_only", "vllm.v1.sample.ops.topk_topp_sampler.apply_top_k_top_p", "vllm.v1.sample.ops.topk_topp_sampler.apply_top_k_top_p_pytorch", "vllm.v1.sample.ops.topk_topp_sampler.compiled_random_sample", "vllm.v1.sample.ops.topk_topp_sampler.flashinfer_sample", "vllm.v1.sample.ops.topk_topp_sampler.logger", "vllm.v1.sample.ops.topk_topp_sampler.random_sample" ], "n_typable": 53, "n_typed": 49, "n_any": 0, "n_untyped": 4, "n_functions": 6, "n_function_overloads": 6, "n_function_params": 16, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 21, "n_classes": 1, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/sample/ops/topk_topp_triton.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.sample.ops.topk_topp_triton.reset_buffer_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.v1.sample.ops.topk_topp_triton.apply_top_k_top_p_triton", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "type_ignores": [], "name": "vllm.v1.sample.ops.topk_topp_triton", "names": [ "vllm.v1.sample.ops.topk_topp_triton.apply_top_k_top_p_triton", "vllm.v1.sample.ops.topk_topp_triton.reset_buffer_cache" ], "n_typable": 6, "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 4, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/sample/rejection_sampler.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.sample.rejection_sampler.rejection_random_sample_kernel", "n_typed": 1, "n_any": 0, "n_untyped": 12, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 }, { "kind": "function", "name": "vllm.v1.sample.rejection_sampler.generate_uniform_probs", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.v1.sample.rejection_sampler.expand_batch_to_tokens", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.v1.sample.rejection_sampler.sample_recovered_tokens", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "vllm.v1.sample.rejection_sampler.rejection_greedy_sample_kernel", "n_typed": 0, "n_any": 0, "n_untyped": 8, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "attr", "name": "vllm.v1.sample.rejection_sampler.GREEDY_TEMPERATURE", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.v1.sample.rejection_sampler.MAX_SPEC_LEN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.v1.sample.rejection_sampler.rejection_sample", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "class", "name": "vllm.v1.sample.rejection_sampler.RejectionSampler", "methods": [ { "kind": "function", "name": "RejectionSampler.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RejectionSampler.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "RejectionSampler._get_logprobs_tensors", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "RejectionSampler.parse_output", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "RejectionSampler.apply_logits_processors", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "RejectionSampler.apply_penalties", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "RejectionSampler._combine_outputs_with_spec_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "RejectionSampler.sampler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RejectionSampler.is_processed_logprobs_mode", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RejectionSampler.is_logits_logprobs_mode", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 35, "n_typed": 31, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 25, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.sample.rejection_sampler.PLACEHOLDER_TOKEN_ID", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "function", "name": "vllm.v1.sample.rejection_sampler.apply_sampling_constraints", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.v1.sample.rejection_sampler.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.v1.sample.rejection_sampler.sample_recovered_tokens_kernel", "n_typed": 2, "n_any": 0, "n_untyped": 8, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "vllm.v1.sample.rejection_sampler.expand_kernel", "n_typed": 1, "n_any": 0, "n_untyped": 6, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "type_ignores": [], "name": "vllm.v1.sample.rejection_sampler", "names": [ "vllm.v1.sample.rejection_sampler.GREEDY_TEMPERATURE", "vllm.v1.sample.rejection_sampler.MAX_SPEC_LEN", "vllm.v1.sample.rejection_sampler.PLACEHOLDER_TOKEN_ID", "vllm.v1.sample.rejection_sampler.RejectionSampler", "vllm.v1.sample.rejection_sampler.apply_sampling_constraints", "vllm.v1.sample.rejection_sampler.expand_batch_to_tokens", "vllm.v1.sample.rejection_sampler.expand_kernel", "vllm.v1.sample.rejection_sampler.generate_uniform_probs", "vllm.v1.sample.rejection_sampler.logger", "vllm.v1.sample.rejection_sampler.rejection_greedy_sample_kernel", "vllm.v1.sample.rejection_sampler.rejection_random_sample_kernel", "vllm.v1.sample.rejection_sampler.rejection_sample", "vllm.v1.sample.rejection_sampler.sample_recovered_tokens", "vllm.v1.sample.rejection_sampler.sample_recovered_tokens_kernel" ], "n_typable": 109, "n_typed": 70, "n_any": 0, "n_untyped": 39, "n_functions": 9, "n_function_overloads": 9, "n_function_params": 62, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 25, "n_classes": 1, "n_attrs": 7, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/sample/sampler.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.sample.sampler.Sampler", "methods": [ { "kind": "function", "name": "Sampler.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Sampler.forward", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Sampler.apply_temperature", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Sampler.greedy_sample", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Sampler.sample", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Sampler.compute_logprobs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Sampler.gather_logprobs", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Sampler._combine_outputs_with_spec_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Sampler.apply_logits_processors", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Sampler.apply_penalties", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Sampler.topk_topp_sampler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Sampler.pin_memory", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Sampler.logprobs_mode", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 37, "n_typed": 33, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 24, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.sample.sampler", "names": [ "vllm.v1.sample.sampler.Sampler" ], "n_typable": 37, "n_typed": 33, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 24, "n_classes": 1, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/serial_utils.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.v1.serial_utils.MMF_CLASS_TO_FACTORY", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "vllm.v1.serial_utils.CUSTOM_TYPE_CLOUDPICKLE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.v1.serial_utils.CUSTOM_TYPE_RAW_VIEW", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.v1.serial_utils.UtilityResult", "methods": [ { "kind": "function", "name": "UtilityResult.__init__", "n_typed": 0, "n_any": 1, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "UtilityResult.result", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 3, "n_typed": 0, "n_any": 1, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.serial_utils.PydanticMsgspecMixin", "methods": [ { "kind": "function", "name": "PydanticMsgspecMixin.__get_pydantic_core_schema__", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PydanticMsgspecMixin._validate_msgspec", "n_typed": 0, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 5, "n_typed": 2, "n_any": 3, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.serial_utils.CUSTOM_TYPE_PICKLE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.v1.serial_utils.run_method", "n_typed": 3, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "attr", "name": "vllm.v1.serial_utils.bytestr", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.serial_utils.MsgpackEncoder", "methods": [ { "kind": "function", "name": "MsgpackEncoder.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MsgpackEncoder.encode", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MsgpackEncoder.encode_into", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MsgpackEncoder.enc_hook", "n_typed": 0, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MsgpackEncoder._encode_ndarray", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MsgpackEncoder._encode_tensor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MsgpackEncoder._encode_mm_items", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MsgpackEncoder._encode_mm_item", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MsgpackEncoder._encode_mm_field_elem", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MsgpackEncoder._encode_nested_tensors", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MsgpackEncoder._encode_mm_field", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MsgpackEncoder.encoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MsgpackEncoder.aux_buffers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "MsgpackEncoder.size_threshold", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 26, "n_typed": 17, "n_any": 5, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 12, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.serial_utils.MsgpackDecoder", "methods": [ { "kind": "function", "name": "MsgpackDecoder.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MsgpackDecoder.decode", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MsgpackDecoder.dec_hook", "n_typed": 1, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MsgpackDecoder._decode_utility_result", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MsgpackDecoder._convert_result", "n_typed": 1, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MsgpackDecoder._decode_ndarray", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MsgpackDecoder._decode_tensor", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MsgpackDecoder._decode_mm_items", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MsgpackDecoder._decode_mm_item", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MsgpackDecoder._decode_mm_field_elem", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MsgpackDecoder._decode_nested_tensors", "n_typed": 1, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MsgpackDecoder._decode_nested_slices", "n_typed": 0, "n_any": 2, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MsgpackDecoder.ext_hook", "n_typed": 2, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MsgpackDecoder.share_mem", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MsgpackDecoder.pin_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MsgpackDecoder.decoder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MsgpackDecoder.aux_buffers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 34, "n_typed": 18, "n_any": 12, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 17, "n_attrs": 4, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.serial_utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.v1.serial_utils", "names": [ "vllm.v1.serial_utils.CUSTOM_TYPE_CLOUDPICKLE", "vllm.v1.serial_utils.CUSTOM_TYPE_PICKLE", "vllm.v1.serial_utils.CUSTOM_TYPE_RAW_VIEW", "vllm.v1.serial_utils.MMF_CLASS_TO_FACTORY", "vllm.v1.serial_utils.MsgpackDecoder", "vllm.v1.serial_utils.MsgpackEncoder", "vllm.v1.serial_utils.PydanticMsgspecMixin", "vllm.v1.serial_utils.UtilityResult", "vllm.v1.serial_utils.bytestr", "vllm.v1.serial_utils.logger", "vllm.v1.serial_utils.run_method" ], "n_typable": 76, "n_typed": 42, "n_any": 23, "n_untyped": 11, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 4, "n_methods": 27, "n_method_overloads": 27, "n_method_params": 33, "n_classes": 4, "n_attrs": 14, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/spec_decode/draft_model.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.v1.spec_decode.draft_model.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.spec_decode.draft_model.DraftModelProposer", "methods": [ { "kind": "function", "name": "DraftModelProposer.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DraftModelProposer._raise_if_vocab_size_mismatch", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DraftModelProposer._raise_if_draft_tp_mismatch", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DraftModelProposer._get_model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DraftModelProposer._maybe_share_embeddings", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DraftModelProposer._maybe_share_lm_head", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 11, "n_typed": 7, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.spec_decode.draft_model", "names": [ "vllm.v1.spec_decode.draft_model.DraftModelProposer", "vllm.v1.spec_decode.draft_model.logger" ], "n_typable": 12, "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 5, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/spec_decode/eagle.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.spec_decode.eagle.SpecDecodeBaseProposer", "methods": [ { "kind": "function", "name": "SpecDecodeBaseProposer.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "SpecDecodeBaseProposer._raise_if_padded_drafter_batch_disabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SpecDecodeBaseProposer._raise_if_multimodal", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SpecDecodeBaseProposer._raise_if_mrope", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SpecDecodeBaseProposer._init_parallel_drafting_params", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SpecDecodeBaseProposer._get_positions", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SpecDecodeBaseProposer._set_positions", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SpecDecodeBaseProposer._get_slot_mapping", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SpecDecodeBaseProposer.initialize_cudagraph_keys", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SpecDecodeBaseProposer._greedy_sample", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SpecDecodeBaseProposer.propose", "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "SpecDecodeBaseProposer.set_inputs_first_pass", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "SpecDecodeBaseProposer.model_returns_tuple", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SpecDecodeBaseProposer.prepare_next_token_ids_cpu", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "SpecDecodeBaseProposer.prepare_next_token_ids_padded", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "SpecDecodeBaseProposer.prepare_inputs_padded", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SpecDecodeBaseProposer.propose_tree", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "SpecDecodeBaseProposer.prepare_inputs", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SpecDecodeBaseProposer.get_model_name", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SpecDecodeBaseProposer._get_model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SpecDecodeBaseProposer.load_model", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SpecDecodeBaseProposer._maybe_share_embeddings", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SpecDecodeBaseProposer._maybe_share_lm_head", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SpecDecodeBaseProposer.dummy_run", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "SpecDecodeBaseProposer._get_eagle3_use_aux_hidden_state_from_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SpecDecodeBaseProposer.validate_same_kv_cache_group", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SpecDecodeBaseProposer.initialize_attn_backend", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SpecDecodeBaseProposer._determine_batch_execution_and_padding", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SpecDecodeBaseProposer.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.speculative_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.draft_model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.method", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.pass_hidden_states_to_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.runner", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.max_model_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.dp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.num_speculative_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.inputs_embeds_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.parallel_drafting", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.extra_slots_per_request", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.net_num_new_slots_per_request", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.needs_extra_input_slots", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.parallel_drafting_token_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.parallel_drafting_hidden_state_tensor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.use_local_argmax_reduction", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.max_num_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.token_arange_np", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.mm_registry", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.supports_mm_inputs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.draft_attn_groups", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.kv_cache_gid", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.eagle3_use_aux_hidden_state", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.compilation_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.cudagraph_dispatcher", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.input_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.uses_mrope", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.uses_xdrope_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.draft_uses_xdrope_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.hidden_states", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.arange", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.is_rejected_token_mask", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.is_masked_token_mask", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.inputs_embeds", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.backup_next_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.allowed_attn_types", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.tree_choices", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.cu_drafts_per_level", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.child_drafts_per_level", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.tree_draft_pos_offsets", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.mrope_positions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.xdrope_positions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodeBaseProposer.positions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 137, "n_typed": 93, "n_any": 0, "n_untyped": 44, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 28, "n_method_overloads": 28, "n_method_params": 62, "n_attrs": 47, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.spec_decode.eagle.EagleProposer", "methods": [ { "kind": "function", "name": "EagleProposer.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.spec_decode.eagle.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.v1.spec_decode.eagle.compute_probs_and_sample_next_token", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.v1.spec_decode.eagle", "names": [ "vllm.v1.spec_decode.eagle.EagleProposer", "vllm.v1.spec_decode.eagle.SpecDecodeBaseProposer", "vllm.v1.spec_decode.eagle.compute_probs_and_sample_next_token", "vllm.v1.spec_decode.eagle.logger" ], "n_typable": 145, "n_typed": 98, "n_any": 0, "n_untyped": 47, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 29, "n_method_overloads": 29, "n_method_params": 65, "n_classes": 2, "n_attrs": 48, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/spec_decode/extract_hidden_states.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.v1.spec_decode.extract_hidden_states.PADDING_SLOT_ID", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.v1.spec_decode.extract_hidden_states.ExtractHiddenStatesProposer", "methods": [ { "kind": "function", "name": "ExtractHiddenStatesProposer.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ExtractHiddenStatesProposer.propose", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "ExtractHiddenStatesProposer._get_slot_mapping", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ExtractHiddenStatesProposer._determine_batch_execution_and_padding", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ExtractHiddenStatesProposer.initialize_cudagraph_keys", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ExtractHiddenStatesProposer.dummy_run", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ExtractHiddenStatesProposer._build_attn_metadata_builder", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ExtractHiddenStatesProposer.prepare_next_token_ids_padded", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "ExtractHiddenStatesProposer.load_model", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ExtractHiddenStatesProposer.validate_same_kv_cache_group", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ExtractHiddenStatesProposer.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExtractHiddenStatesProposer.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExtractHiddenStatesProposer.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExtractHiddenStatesProposer.dp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExtractHiddenStatesProposer.model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ExtractHiddenStatesProposer.attn_layer_names", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ExtractHiddenStatesProposer.attn_metadata_builder", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "ExtractHiddenStatesProposer.max_num_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExtractHiddenStatesProposer.hf_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExtractHiddenStatesProposer.num_hidden_states", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExtractHiddenStatesProposer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExtractHiddenStatesProposer.hidden_states", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ExtractHiddenStatesProposer.cudagraph_dispatcher", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 47, "n_typed": 35, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 24, "n_attrs": 13, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.spec_decode.extract_hidden_states", "names": [ "vllm.v1.spec_decode.extract_hidden_states.ExtractHiddenStatesProposer", "vllm.v1.spec_decode.extract_hidden_states.PADDING_SLOT_ID" ], "n_typable": 47, "n_typed": 35, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 24, "n_classes": 1, "n_attrs": 14, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/spec_decode/medusa.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.spec_decode.medusa.MedusaProposer", "methods": [ { "kind": "function", "name": "MedusaProposer.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MedusaProposer.propose", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "MedusaProposer.load_model", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MedusaProposer.dummy_run", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MedusaProposer.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MedusaProposer.spec_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MedusaProposer.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MedusaProposer.max_num_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MedusaProposer.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MedusaProposer.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 10, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 7, "n_attrs": 6, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.spec_decode.medusa.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.v1.spec_decode.medusa", "names": [ "vllm.v1.spec_decode.medusa.MedusaProposer", "vllm.v1.spec_decode.medusa.logger" ], "n_typable": 18, "n_typed": 10, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 7, "n_classes": 1, "n_attrs": 7, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/spec_decode/metadata.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.spec_decode.metadata.SpecDecodeMetadata", "methods": [ { "kind": "function", "name": "SpecDecodeMetadata.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SpecDecodeMetadata.make_dummy", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SpecDecodeMetadata.draft_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SpecDecodeMetadata.num_draft_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SpecDecodeMetadata.cu_num_draft_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SpecDecodeMetadata.cu_num_sampled_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SpecDecodeMetadata.target_logits_indices", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SpecDecodeMetadata.bonus_logits_indices", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SpecDecodeMetadata.logits_indices", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 4, "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 7, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.spec_decode.metadata", "names": [ "vllm.v1.spec_decode.metadata.SpecDecodeMetadata" ], "n_typable": 4, "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_classes": 1, "n_attrs": 7, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/spec_decode/metrics.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.spec_decode.metrics.SpecDecodingProm", "methods": [ { "kind": "function", "name": "SpecDecodingProm.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SpecDecodingProm.observe", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SpecDecodingProm._counter_cls", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SpecDecodingProm.spec_decoding_enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodingProm.counter_spec_decode_num_drafts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodingProm.counter_spec_decode_num_draft_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodingProm.counter_spec_decode_num_accepted_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SpecDecodingProm.counter_spec_decode_num_accepted_tokens_per_pos", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 12, "n_typed": 6, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 6, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.spec_decode.metrics.make_per_engine", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.v1.spec_decode.metrics.SpecDecodingLogging", "methods": [ { "kind": "function", "name": "SpecDecodingLogging.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SpecDecodingLogging.reset", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SpecDecodingLogging.observe", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SpecDecodingLogging.log", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 6, "n_typed": 1, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 2, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.spec_decode.metrics.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.spec_decode.metrics.SpecDecodingStats", "methods": [ { "kind": "function", "name": "SpecDecodingStats.new", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SpecDecodingStats.observe_draft", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SpecDecodingStats.num_spec_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SpecDecodingStats.num_drafts", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SpecDecodingStats.num_draft_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SpecDecodingStats.num_accepted_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SpecDecodingStats.num_accepted_tokens_per_pos", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 5, "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 3, "n_attrs": 5, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.spec_decode.metrics", "names": [ "vllm.v1.spec_decode.metrics.SpecDecodingLogging", "vllm.v1.spec_decode.metrics.SpecDecodingProm", "vllm.v1.spec_decode.metrics.SpecDecodingStats", "vllm.v1.spec_decode.metrics.logger", "vllm.v1.spec_decode.metrics.make_per_engine" ], "n_typable": 27, "n_typed": 13, "n_any": 0, "n_untyped": 14, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 10, "n_classes": 3, "n_attrs": 12, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/spec_decode/ngram_proposer.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.spec_decode.ngram_proposer.NgramProposer", "methods": [ { "kind": "function", "name": "NgramProposer.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "NgramProposer.batch_propose", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "NgramProposer.propose", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "NgramProposer.load_model", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "NgramProposer.min_n", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NgramProposer.max_n", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NgramProposer.k", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NgramProposer.max_model_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NgramProposer.valid_ngram_draft", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NgramProposer.valid_ngram_num_drafts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NgramProposer.num_tokens_threshold", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "NgramProposer.num_numba_thread_available", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 23, "n_typed": 11, "n_any": 0, "n_untyped": 12, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 11, "n_attrs": 8, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.spec_decode.ngram_proposer.batch_propose_numba", "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 } ], "type_ignores": [], "name": "vllm.v1.spec_decode.ngram_proposer", "names": [ "vllm.v1.spec_decode.ngram_proposer.NgramProposer", "vllm.v1.spec_decode.ngram_proposer.batch_propose_numba" ], "n_typable": 33, "n_typed": 20, "n_any": 0, "n_untyped": 13, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 9, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 11, "n_classes": 1, "n_attrs": 8, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/spec_decode/suffix_decoding.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.spec_decode.suffix_decoding.SuffixDecodingProposer", "methods": [ { "kind": "function", "name": "SuffixDecodingProposer.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "SuffixDecodingProposer.propose", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SuffixDecodingProposer.load_model", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SuffixDecodingProposer.num_speculative_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SuffixDecodingProposer.max_tree_depth", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SuffixDecodingProposer.max_spec_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SuffixDecodingProposer.min_token_prob", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SuffixDecodingProposer.max_model_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SuffixDecodingProposer.suffix_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 15, "n_typed": 5, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.spec_decode.suffix_decoding", "names": [ "vllm.v1.spec_decode.suffix_decoding.SuffixDecodingProposer" ], "n_typable": 15, "n_typed": 5, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_classes": 1, "n_attrs": 6, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/spec_decode/utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.spec_decode.utils.compute_new_slot_mapping", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.v1.spec_decode.utils.copy_and_expand_eagle_inputs_kernel", "n_typed": 1, "n_any": 0, "n_untyped": 17, "n_overloads": 1, "n_typable": 18, "n_params": 17, "n_function_overloads": 1, "n_function_params": 17 }, { "kind": "attr", "name": "vllm.v1.spec_decode.utils.PADDING_SLOT_ID", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.v1.spec_decode.utils.extend_all_queries_by_N", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.v1.spec_decode.utils.eagle_prepare_inputs_padded_kernel", "n_typed": 0, "n_any": 0, "n_untyped": 7, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.v1.spec_decode.utils.create_vllm_config_for_draft_model", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.v1.spec_decode.utils.eagle_prepare_next_token_padded_kernel", "n_typed": 1, "n_any": 0, "n_untyped": 10, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 } ], "type_ignores": [], "name": "vllm.v1.spec_decode.utils", "names": [ "vllm.v1.spec_decode.utils.PADDING_SLOT_ID", "vllm.v1.spec_decode.utils.compute_new_slot_mapping", "vllm.v1.spec_decode.utils.copy_and_expand_eagle_inputs_kernel", "vllm.v1.spec_decode.utils.create_vllm_config_for_draft_model", "vllm.v1.spec_decode.utils.eagle_prepare_inputs_padded_kernel", "vllm.v1.spec_decode.utils.eagle_prepare_next_token_padded_kernel", "vllm.v1.spec_decode.utils.extend_all_queries_by_N" ], "n_typable": 50, "n_typed": 15, "n_any": 0, "n_untyped": 35, "n_functions": 6, "n_function_overloads": 6, "n_function_params": 44, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/structured_output/__init__.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.v1.structured_output.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.structured_output.StructuredOutputManager", "methods": [ { "kind": "function", "name": "StructuredOutputManager.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StructuredOutputManager.grammar_init", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StructuredOutputManager._create_grammar", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StructuredOutputManager._fill_bitmasks", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StructuredOutputManager._async_submit_fill_bitmask", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StructuredOutputManager.grammar_bitmask", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "StructuredOutputManager.should_fill_bitmask", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StructuredOutputManager.should_advance", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StructuredOutputManager.clear_backend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "StructuredOutputManager.backend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "StructuredOutputManager.reasoner", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "StructuredOutputManager.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StructuredOutputManager.fill_bitmask_parallel_threshold", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StructuredOutputManager.enable_in_reasoning", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StructuredOutputManager.fill_bitmask_parallel_batch_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StructuredOutputManager.executor_for_fillmask", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StructuredOutputManager.executor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StructuredOutputManager.tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 28, "n_typed": 20, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 10, "n_attrs": 9, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.structured_output.torch", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.v1.structured_output", "names": [ "vllm.v1.structured_output.StructuredOutputManager", "vllm.v1.structured_output.logger", "vllm.v1.structured_output.torch" ], "n_typable": 30, "n_typed": 20, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 10, "n_classes": 1, "n_attrs": 11, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/structured_output/backend_guidance.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.structured_output.backend_guidance.GuidanceBackend", "methods": [ { "kind": "function", "name": "GuidanceBackend.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GuidanceBackend.compile_grammar", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GuidanceBackend.allocate_token_bitmask", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GuidanceBackend.destroy", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 4, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.structured_output.backend_guidance.llguidance_hf", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.v1.structured_output.backend_guidance.process_for_additional_properties", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.v1.structured_output.backend_guidance.GuidanceGrammar", "methods": [ { "kind": "function", "name": "GuidanceGrammar.check_error", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GuidanceGrammar.accept_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GuidanceGrammar.validate_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GuidanceGrammar.rollback", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GuidanceGrammar.fill_bitmask", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GuidanceGrammar.is_terminated", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GuidanceGrammar.reset", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GuidanceGrammar.ll_matcher", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GuidanceGrammar.ll_tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GuidanceGrammar.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GuidanceGrammar.printed_error", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GuidanceGrammar.terminated", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "GuidanceGrammar.rollback_lag", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 13, "n_typed": 11, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 6, "n_attrs": 6, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.structured_output.backend_guidance.llguidance", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.v1.structured_output.backend_guidance.has_guidance_unsupported_json_features", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.v1.structured_output.backend_guidance.validate_guidance_grammar", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.v1.structured_output.backend_guidance.serialize_guidance_grammar", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "attr", "name": "vllm.v1.structured_output.backend_guidance.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.v1.structured_output.backend_guidance.llguidance_torch", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.v1.structured_output.backend_guidance", "names": [ "vllm.v1.structured_output.backend_guidance.GuidanceBackend", "vllm.v1.structured_output.backend_guidance.GuidanceGrammar", "vllm.v1.structured_output.backend_guidance.has_guidance_unsupported_json_features", "vllm.v1.structured_output.backend_guidance.llguidance", "vllm.v1.structured_output.backend_guidance.llguidance_hf", "vllm.v1.structured_output.backend_guidance.llguidance_torch", "vllm.v1.structured_output.backend_guidance.logger", "vllm.v1.structured_output.backend_guidance.process_for_additional_properties", "vllm.v1.structured_output.backend_guidance.serialize_guidance_grammar", "vllm.v1.structured_output.backend_guidance.validate_guidance_grammar" ], "n_typable": 36, "n_typed": 27, "n_any": 0, "n_untyped": 9, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 8, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 9, "n_classes": 2, "n_attrs": 10, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/structured_output/backend_lm_format_enforcer.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.structured_output.backend_lm_format_enforcer.LMFormatEnforcerBackend", "methods": [ { "kind": "function", "name": "LMFormatEnforcerBackend.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LMFormatEnforcerBackend.compile_grammar", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LMFormatEnforcerBackend.allocate_token_bitmask", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LMFormatEnforcerBackend.destroy", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.structured_output.backend_lm_format_enforcer.lmfe_vllm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.structured_output.backend_lm_format_enforcer.LMFormatEnforcerGrammar", "methods": [ { "kind": "function", "name": "LMFormatEnforcerGrammar.accept_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LMFormatEnforcerGrammar.validate_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LMFormatEnforcerGrammar.rollback", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LMFormatEnforcerGrammar.fill_bitmask", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LMFormatEnforcerGrammar.is_terminated", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LMFormatEnforcerGrammar.reset", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LMFormatEnforcerGrammar.token_enforcer", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LMFormatEnforcerGrammar.current_tokens_prefix", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 12, "n_typed": 11, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 6, "n_attrs": 2, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.structured_output.backend_lm_format_enforcer.validate_structured_output_request_lm_format_enforcer", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.v1.structured_output.backend_lm_format_enforcer.lmformatenforcer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.v1.structured_output.backend_lm_format_enforcer", "names": [ "vllm.v1.structured_output.backend_lm_format_enforcer.LMFormatEnforcerBackend", "vllm.v1.structured_output.backend_lm_format_enforcer.LMFormatEnforcerGrammar", "vllm.v1.structured_output.backend_lm_format_enforcer.lmfe_vllm", "vllm.v1.structured_output.backend_lm_format_enforcer.lmformatenforcer", "vllm.v1.structured_output.backend_lm_format_enforcer.validate_structured_output_request_lm_format_enforcer" ], "n_typable": 23, "n_typed": 17, "n_any": 0, "n_untyped": 6, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 9, "n_classes": 2, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/structured_output/backend_outlines.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.v1.structured_output.backend_outlines.oc", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.structured_output.backend_outlines.OutlinesGrammar", "methods": [ { "kind": "function", "name": "OutlinesGrammar.accept_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OutlinesGrammar.rollback", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OutlinesGrammar.validate_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OutlinesGrammar.fill_bitmask", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OutlinesGrammar.is_terminated", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "OutlinesGrammar.reset", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OutlinesGrammar.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "OutlinesGrammar.guide", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "OutlinesGrammar.num_processed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "OutlinesGrammar._prev_finished", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 12, "n_typed": 11, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 6, "n_attrs": 4, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.structured_output.backend_outlines.validate_regex_is_buildable", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.v1.structured_output.backend_outlines.OutlinesBackend", "methods": [ { "kind": "function", "name": "OutlinesBackend.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "OutlinesBackend._compile_index", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OutlinesBackend.compile_grammar", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "OutlinesBackend.allocate_token_bitmask", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "OutlinesBackend.destroy", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 10, "n_typed": 8, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.structured_output.backend_outlines.json_schema", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.v1.structured_output.backend_outlines.validate_structured_output_request_outlines", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.v1.structured_output.backend_outlines", "names": [ "vllm.v1.structured_output.backend_outlines.OutlinesBackend", "vllm.v1.structured_output.backend_outlines.OutlinesGrammar", "vllm.v1.structured_output.backend_outlines.json_schema", "vllm.v1.structured_output.backend_outlines.oc", "vllm.v1.structured_output.backend_outlines.validate_regex_is_buildable", "vllm.v1.structured_output.backend_outlines.validate_structured_output_request_outlines" ], "n_typable": 28, "n_typed": 22, "n_any": 0, "n_untyped": 6, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 2, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 11, "n_classes": 2, "n_attrs": 6, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/structured_output/backend_types.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.structured_output.backend_types.StructuredOutputBackend", "methods": [ { "kind": "function", "name": "StructuredOutputBackend.compile_grammar", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StructuredOutputBackend.allocate_token_bitmask", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StructuredOutputBackend.destroy", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "StructuredOutputBackend.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StructuredOutputBackend.tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StructuredOutputBackend.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 6, "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.structured_output.backend_types.TokenizerLike", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.v1.structured_output.backend_types.StructuredOutputKey", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.v1.structured_output.backend_types.StructuredOutputOptions", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "StructuredOutputOptions.JSON", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StructuredOutputOptions.JSON_OBJECT", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StructuredOutputOptions.REGEX", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StructuredOutputOptions.GRAMMAR", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StructuredOutputOptions.CHOICE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StructuredOutputOptions.STRUCTURAL_TAG", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 6, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.structured_output.backend_types.VllmConfig", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.v1.structured_output.backend_types.StructuredOutputGrammar", "methods": [ { "kind": "function", "name": "StructuredOutputGrammar.accept_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StructuredOutputGrammar.validate_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StructuredOutputGrammar.rollback", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StructuredOutputGrammar.fill_bitmask", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StructuredOutputGrammar.is_terminated", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "StructuredOutputGrammar.reset", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 11, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 6, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.structured_output.backend_types", "names": [ "vllm.v1.structured_output.backend_types.StructuredOutputBackend", "vllm.v1.structured_output.backend_types.StructuredOutputGrammar", "vllm.v1.structured_output.backend_types.StructuredOutputKey", "vllm.v1.structured_output.backend_types.StructuredOutputOptions", "vllm.v1.structured_output.backend_types.TokenizerLike", "vllm.v1.structured_output.backend_types.VllmConfig" ], "n_typable": 18, "n_typed": 16, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 9, "n_classes": 3, "n_attrs": 12, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/structured_output/backend_xgrammar.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.v1.structured_output.backend_xgrammar.xgr", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.structured_output.backend_xgrammar.XgrammarBackend", "methods": [ { "kind": "function", "name": "XgrammarBackend.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "XgrammarBackend.compile_grammar", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "XgrammarBackend.allocate_token_bitmask", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "XgrammarBackend.destroy", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 4, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 3, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.structured_output.backend_xgrammar.validate_xgrammar_grammar", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.v1.structured_output.backend_xgrammar.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.v1.structured_output.backend_xgrammar.has_xgrammar_unsupported_json_features", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.v1.structured_output.backend_xgrammar.STRING_SUPPORTED_FORMATS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.v1.structured_output.backend_xgrammar.XgrammarGrammar", "methods": [ { "kind": "function", "name": "XgrammarGrammar.accept_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "XgrammarGrammar.validate_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "XgrammarGrammar.rollback", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "XgrammarGrammar.fill_bitmask", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "XgrammarGrammar.is_terminated", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "XgrammarGrammar.reset", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "XgrammarGrammar.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "XgrammarGrammar.matcher", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "XgrammarGrammar.ctx", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "XgrammarGrammar.num_processed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "XgrammarGrammar._is_terminated", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 12, "n_typed": 11, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 6, "n_attrs": 5, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.structured_output.backend_xgrammar", "names": [ "vllm.v1.structured_output.backend_xgrammar.STRING_SUPPORTED_FORMATS", "vllm.v1.structured_output.backend_xgrammar.XgrammarBackend", "vllm.v1.structured_output.backend_xgrammar.XgrammarGrammar", "vllm.v1.structured_output.backend_xgrammar.has_xgrammar_unsupported_json_features", "vllm.v1.structured_output.backend_xgrammar.logger", "vllm.v1.structured_output.backend_xgrammar.validate_xgrammar_grammar", "vllm.v1.structured_output.backend_xgrammar.xgr" ], "n_typable": 25, "n_typed": 19, "n_any": 0, "n_untyped": 6, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 2, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 9, "n_classes": 2, "n_attrs": 8, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/structured_output/request.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.structured_output.request.StructuredOutputRequest", "methods": [ { "kind": "function", "name": "StructuredOutputRequest.from_sampling_params", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "StructuredOutputRequest._check_grammar_completion", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "StructuredOutputRequest.is_grammar_ready", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "StructuredOutputRequest.grammar", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_typable": 2 }, { "kind": "property", "name": "StructuredOutputRequest.structured_output_key", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "StructuredOutputRequest.params", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StructuredOutputRequest._grammar", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "StructuredOutputRequest.reasoning_ended", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 3, "n_properties": 3 }, { "kind": "function", "name": "vllm.v1.structured_output.request.get_structured_output_key", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.v1.structured_output.request", "names": [ "vllm.v1.structured_output.request.StructuredOutputRequest", "vllm.v1.structured_output.request.get_structured_output_key" ], "n_typable": 9, "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_classes": 1, "n_attrs": 3, "n_properties": 3, "n_type_ignores": 0 }, { "path": "vllm/v1/structured_output/utils.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.v1.structured_output.utils.re_replacement_seq", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.v1.structured_output.utils.oc", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.v1.structured_output.utils.convert_slow_tokenizer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.v1.structured_output.utils.convert_lark_to_ebnf", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.v1.structured_output.utils.xgr", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.v1.structured_output.utils.choice_as_grammar", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.v1.structured_output.utils.OutlinesVocabulary", "methods": [ { "kind": "function", "name": "OutlinesVocabulary.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "OutlinesVocabulary.inner", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.structured_output.utils.apply_grammar_bitmask", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.v1.structured_output.utils.get_outlines_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.v1.structured_output.utils.CACHE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.v1.structured_output.utils.re_llama_byte_token", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.v1.structured_output.utils.get_outlines_vocabulary", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.v1.structured_output.utils.file_utils", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.v1.structured_output.utils.get_outlines_cache_path", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.v1.structured_output.utils.grammar_is_likely_lark", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.v1.structured_output.utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.v1.structured_output.utils", "names": [ "vllm.v1.structured_output.utils.CACHE", "vllm.v1.structured_output.utils.OutlinesVocabulary", "vllm.v1.structured_output.utils.apply_grammar_bitmask", "vllm.v1.structured_output.utils.choice_as_grammar", "vllm.v1.structured_output.utils.convert_lark_to_ebnf", "vllm.v1.structured_output.utils.convert_slow_tokenizer", "vllm.v1.structured_output.utils.file_utils", "vllm.v1.structured_output.utils.get_outlines_cache", "vllm.v1.structured_output.utils.get_outlines_cache_path", "vllm.v1.structured_output.utils.get_outlines_vocabulary", "vllm.v1.structured_output.utils.grammar_is_likely_lark", "vllm.v1.structured_output.utils.logger", "vllm.v1.structured_output.utils.oc", "vllm.v1.structured_output.utils.re_llama_byte_token", "vllm.v1.structured_output.utils.re_replacement_seq", "vllm.v1.structured_output.utils.xgr" ], "n_typable": 25, "n_typed": 16, "n_any": 0, "n_untyped": 9, "n_functions": 7, "n_function_overloads": 7, "n_function_params": 8, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_classes": 1, "n_attrs": 9, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.utils.get_engine_client_zmq_addr", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.v1.utils.report_usage_stats", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.v1.utils.ConstantList", "methods": [ { "kind": "function", "name": "ConstantList.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ConstantList.append", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ConstantList.extend", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ConstantList.insert", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ConstantList.pop", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ConstantList.remove", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ConstantList.clear", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ConstantList.index", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ConstantList.__getitem__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 3, "n_params": 2, "n_function_overloads": 2, "n_function_params": 2 }, { "kind": "function", "name": "ConstantList.__setitem__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 2, "n_typable": 5, "n_params": 4, "n_function_overloads": 2, "n_function_params": 4 }, { "kind": "function", "name": "ConstantList.__delitem__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ConstantList.__iter__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ConstantList.__contains__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ConstantList.__len__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ConstantList.__repr__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ConstantList.copy", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 33, "n_typed": 14, "n_any": 0, "n_untyped": 19, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 16, "n_method_overloads": 18, "n_method_params": 17, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.utils.T", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.v1.utils.shutdown", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.v1.utils.CpuGpuBuffer", "methods": [ { "kind": "function", "name": "CpuGpuBuffer.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "CpuGpuBuffer.copy_to_gpu", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CpuGpuBuffer.copy_to_cpu", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CpuGpuBuffer.cpu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CpuGpuBuffer.gpu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CpuGpuBuffer.np", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 13, "n_typed": 11, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 7, "n_attrs": 3, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.utils.wait_for_completion_or_failure", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.v1.utils.record_function_or_nullcontext", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.v1.utils.tensor_data", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.v1.utils.APIServerProcessManager", "methods": [ { "kind": "function", "name": "APIServerProcessManager.__init__", "n_typed": 7, "n_any": 1, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "APIServerProcessManager.close", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "APIServerProcessManager.listen_address", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "APIServerProcessManager.sock", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "APIServerProcessManager.args", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "APIServerProcessManager.processes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 14, "n_typed": 9, "n_any": 1, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 8, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.utils.IterationDetails", "methods": [ { "kind": "function", "name": "IterationDetails.__repr__", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "IterationDetails.num_ctx_requests", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "IterationDetails.num_ctx_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "IterationDetails.num_generation_requests", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "IterationDetails.num_generation_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.utils.copy_slice", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.v1.utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.v1.utils.compute_iteration_details", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.v1.utils", "names": [ "vllm.v1.utils.APIServerProcessManager", "vllm.v1.utils.ConstantList", "vllm.v1.utils.CpuGpuBuffer", "vllm.v1.utils.IterationDetails", "vllm.v1.utils.T", "vllm.v1.utils.compute_iteration_details", "vllm.v1.utils.copy_slice", "vllm.v1.utils.get_engine_client_zmq_addr", "vllm.v1.utils.logger", "vllm.v1.utils.record_function_or_nullcontext", "vllm.v1.utils.report_usage_stats", "vllm.v1.utils.shutdown", "vllm.v1.utils.tensor_data", "vllm.v1.utils.wait_for_completion_or_failure" ], "n_typable": 85, "n_typed": 56, "n_any": 1, "n_untyped": 28, "n_functions": 8, "n_function_overloads": 8, "n_function_params": 15, "n_methods": 22, "n_method_overloads": 24, "n_method_params": 32, "n_classes": 4, "n_attrs": 13, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/block_table.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.worker.block_table.BlockTable", "methods": [ { "kind": "function", "name": "BlockTable.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "BlockTable.append_row", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BlockTable.add_row", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BlockTable.move_row", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BlockTable.swap_row", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BlockTable.compute_slot_mapping", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BlockTable.commit_block_table", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BlockTable.commit_slot_mapping", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BlockTable.clear", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BlockTable.map_to_kernel_blocks", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BlockTable.get_device_tensor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BlockTable.get_cpu_tensor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BlockTable.get_numpy_array", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BlockTable._make_buffer", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BlockTable.max_num_reqs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockTable.max_num_batched_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockTable.pin_memory", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockTable.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockTable.max_num_blocks_per_req", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockTable.block_table", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockTable.num_blocks_per_row", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockTable.slot_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockTable.cp_kv_cache_interleave_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockTable.block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockTable.blocks_per_kv_block", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockTable.use_hybrid_blocks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockTable.pcp_world_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockTable.pcp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockTable.dcp_world_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockTable.dcp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 56, "n_typed": 39, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 14, "n_method_overloads": 14, "n_method_params": 26, "n_attrs": 16, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.worker.block_table.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.worker.block_table.MultiGroupBlockTable", "methods": [ { "kind": "function", "name": "MultiGroupBlockTable.__init__", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "MultiGroupBlockTable.append_row", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MultiGroupBlockTable.add_row", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MultiGroupBlockTable.move_row", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MultiGroupBlockTable.swap_row", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MultiGroupBlockTable.compute_slot_mapping", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "MultiGroupBlockTable.commit_block_table", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiGroupBlockTable.commit_slot_mapping", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "MultiGroupBlockTable.clear", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MultiGroupBlockTable.__getitem__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MultiGroupBlockTable.block_tables", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 33, "n_typed": 32, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 22, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.worker.block_table", "names": [ "vllm.v1.worker.block_table.BlockTable", "vllm.v1.worker.block_table.MultiGroupBlockTable", "vllm.v1.worker.block_table.logger" ], "n_typable": 90, "n_typed": 71, "n_any": 0, "n_untyped": 19, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 24, "n_method_overloads": 24, "n_method_params": 48, "n_classes": 2, "n_attrs": 18, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/cp_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.worker.cp_utils.check_attention_cp_compatibility", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.v1.worker.cp_utils.AttentionLayerBase", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.v1.worker.cp_utils.get_total_cp_world_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "type_ignores": [], "name": "vllm.v1.worker.cp_utils", "names": [ "vllm.v1.worker.cp_utils.AttentionLayerBase", "vllm.v1.worker.cp_utils.check_attention_cp_compatibility", "vllm.v1.worker.cp_utils.get_total_cp_world_size" ], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 1, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/cpu_model_runner.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.worker.cpu_model_runner.CPUModelRunner", "methods": [ { "kind": "function", "name": "CPUModelRunner.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CPUModelRunner._postprocess_tensors", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CPUModelRunner.load_model", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CPUModelRunner.get_model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CPUModelRunner.warming_up_model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CPUModelRunner._init_device_properties", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CPUModelRunner._sync_device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CPUModelRunner.get_dp_padding", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CPUModelRunner.use_cuda_graph", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CPUModelRunner.cascade_attn_enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 11, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 4, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.worker.cpu_model_runner.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.v1.worker.cpu_model_runner", "names": [ "vllm.v1.worker.cpu_model_runner.CPUModelRunner", "vllm.v1.worker.cpu_model_runner.logger" ], "n_typable": 15, "n_typed": 11, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 4, "n_classes": 1, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/cpu_worker.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.v1.worker.cpu_worker.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.worker.cpu_worker.CPUWorker", "methods": [ { "kind": "function", "name": "CPUWorker.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "CPUWorker.init_device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CPUWorker.sleep", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CPUWorker.wake_up", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CPUWorker.determine_available_memory", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CPUWorker.compile_or_warm_up_model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CPUWorker._get_autobind_cpu_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "CPUWorker.profile", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CPUWorker.profiler", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 19, "n_typed": 16, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 10, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.worker.cpu_worker", "names": [ "vllm.v1.worker.cpu_worker.CPUWorker", "vllm.v1.worker.cpu_worker.logger" ], "n_typable": 20, "n_typed": 16, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 10, "n_classes": 1, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/dp_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.worker.dp_utils.coordinate_batch_across_dp", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "attr", "name": "vllm.v1.worker.dp_utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.v1.worker.dp_utils", "names": [ "vllm.v1.worker.dp_utils.coordinate_batch_across_dp", "vllm.v1.worker.dp_utils.logger" ], "n_typable": 9, "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 7, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/ec_connector_model_runner_mixin.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.worker.ec_connector_model_runner_mixin.ECConnectorModelRunnerMixin", "methods": [ { "kind": "function", "name": "ECConnectorModelRunnerMixin.maybe_save_ec_to_connector", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ECConnectorModelRunnerMixin.get_finished_ec_transfers", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ECConnectorModelRunnerMixin.maybe_get_ec_connector_output", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ECConnectorModelRunnerMixin._get_ec_connector_output", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 13, "n_typed": 10, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 9, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.worker.ec_connector_model_runner_mixin.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.v1.worker.ec_connector_model_runner_mixin", "names": [ "vllm.v1.worker.ec_connector_model_runner_mixin.ECConnectorModelRunnerMixin", "vllm.v1.worker.ec_connector_model_runner_mixin.logger" ], "n_typable": 14, "n_typed": 10, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 9, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu/async_utils.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.worker.gpu.async_utils.AsyncOutput", "methods": [ { "kind": "function", "name": "AsyncOutput.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "AsyncOutput.get_output", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AsyncOutput.model_runner_output", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AsyncOutput.sampler_output", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AsyncOutput.num_sampled_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AsyncOutput.copy_event", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AsyncOutput.sampled_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AsyncOutput.logprobs_tensors", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AsyncOutput.num_nans", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "AsyncOutput.num_sampled_tokens_np", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AsyncOutput.prompt_logprobs_dict", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 17, "n_typed": 9, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 9, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.worker.gpu.async_utils.async_copy_to_np", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.v1.worker.gpu.async_utils.AsyncPoolingOutput", "methods": [ { "kind": "function", "name": "AsyncPoolingOutput.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "AsyncPoolingOutput.get_output", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AsyncPoolingOutput.model_runner_output", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AsyncPoolingOutput.pooler_output", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AsyncPoolingOutput.is_valid", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AsyncPoolingOutput.copy_event", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AsyncPoolingOutput.pooler_output_cpu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AsyncPoolingOutput.is_valid_cpu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 7, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 6, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.worker.gpu.async_utils.stream", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu.async_utils", "names": [ "vllm.v1.worker.gpu.async_utils.AsyncOutput", "vllm.v1.worker.gpu.async_utils.AsyncPoolingOutput", "vllm.v1.worker.gpu.async_utils.async_copy_to_np", "vllm.v1.worker.gpu.async_utils.stream" ], "n_typable": 36, "n_typed": 20, "n_any": 0, "n_untyped": 16, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 3, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 12, "n_classes": 2, "n_attrs": 15, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu/attn_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.worker.gpu.attn_utils.init_attn_backend", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.v1.worker.gpu.attn_utils.build_attn_metadata", "n_typed": 13, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 }, { "kind": "function", "name": "vllm.v1.worker.gpu.attn_utils.build_slot_mappings_by_layer", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.v1.worker.gpu.attn_utils.get_kv_cache_spec", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.v1.worker.gpu.attn_utils.init_kv_cache", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu.attn_utils", "names": [ "vllm.v1.worker.gpu.attn_utils.build_attn_metadata", "vllm.v1.worker.gpu.attn_utils.build_slot_mappings_by_layer", "vllm.v1.worker.gpu.attn_utils.get_kv_cache_spec", "vllm.v1.worker.gpu.attn_utils.init_attn_backend", "vllm.v1.worker.gpu.attn_utils.init_kv_cache" ], "n_typable": 28, "n_typed": 27, "n_any": 0, "n_untyped": 1, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 23, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu/block_table.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.worker.gpu.block_table.BlockTables", "methods": [ { "kind": "function", "name": "BlockTables.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "BlockTables._make_ptr_tensor", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BlockTables.append_block_ids", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BlockTables.apply_staged_writes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BlockTables.gather_block_tables", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BlockTables.get_dummy_block_tables", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BlockTables.compute_slot_mappings", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BlockTables.get_dummy_slot_mappings", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BlockTables.block_sizes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockTables.max_num_reqs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockTables.max_num_batched_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockTables.max_model_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockTables.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockTables.cp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockTables.cp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockTables.cp_interleave", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockTables.num_kv_cache_groups", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockTables.block_tables", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BlockTables.block_table_ptrs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockTables.block_table_strides", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockTables.block_sizes_tensor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockTables.num_blocks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockTables.input_block_tables", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "BlockTables.input_block_table_ptrs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockTables.slot_mappings", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 43, "n_typed": 27, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 18, "n_attrs": 17, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu.block_table", "names": [ "vllm.v1.worker.gpu.block_table.BlockTables" ], "n_typable": 43, "n_typed": 27, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 18, "n_classes": 1, "n_attrs": 17, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu/buffer_utils.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.worker.gpu.buffer_utils.UvaBackedTensor", "methods": [ { "kind": "function", "name": "UvaBackedTensor.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "UvaBackedTensor.copy_to_uva", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "UvaBackedTensor.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UvaBackedTensor.max_concurrency", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UvaBackedTensor.cpu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UvaBackedTensor.np", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UvaBackedTensor.pool", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UvaBackedTensor.gpu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 5, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 6, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.worker.gpu.buffer_utils.async_copy_to_gpu", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.v1.worker.gpu.buffer_utils.UvaBuffer", "methods": [ { "kind": "function", "name": "UvaBuffer.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "UvaBuffer.cpu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UvaBuffer.np", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UvaBuffer.uva", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 6, "n_typed": 2, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 2, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.worker.gpu.buffer_utils.StagedWriteTensor", "methods": [ { "kind": "function", "name": "StagedWriteTensor.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "StagedWriteTensor.stage_write", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "StagedWriteTensor.stage_write_elem", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StagedWriteTensor.apply_write", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "StagedWriteTensor.clear_staged_writes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "StagedWriteTensor.num_rows", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StagedWriteTensor.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StagedWriteTensor.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StagedWriteTensor.max_concurrency", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StagedWriteTensor.write_indices", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StagedWriteTensor.write_starts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StagedWriteTensor.write_cu_lens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StagedWriteTensor.gpu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 23, "n_typed": 14, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 10, "n_attrs": 8, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.worker.gpu.buffer_utils.UvaBufferPool", "methods": [ { "kind": "function", "name": "UvaBufferPool.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "UvaBufferPool.copy_to_uva", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "UvaBufferPool.copy_to_gpu", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "UvaBufferPool.size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UvaBufferPool.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UvaBufferPool.max_concurrency", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 8, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu.buffer_utils", "names": [ "vllm.v1.worker.gpu.buffer_utils.StagedWriteTensor", "vllm.v1.worker.gpu.buffer_utils.UvaBackedTensor", "vllm.v1.worker.gpu.buffer_utils.UvaBuffer", "vllm.v1.worker.gpu.buffer_utils.UvaBufferPool", "vllm.v1.worker.gpu.buffer_utils.async_copy_to_gpu" ], "n_typable": 57, "n_typed": 33, "n_any": 0, "n_untyped": 24, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 3, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 22, "n_classes": 4, "n_attrs": 20, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu/cp_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.worker.gpu.cp_utils.prepare_dcp_local_seq_lens", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu.cp_utils", "names": [ "vllm.v1.worker.gpu.cp_utils.prepare_dcp_local_seq_lens" ], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 6, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu/cudagraph_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.worker.gpu.cudagraph_utils.capture_graphs", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.v1.worker.gpu.cudagraph_utils.prepare_inputs_to_capture", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "class", "name": "vllm.v1.worker.gpu.cudagraph_utils.CudaGraphManager", "methods": [ { "kind": "function", "name": "CudaGraphManager.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "CudaGraphManager.needs_capture", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CudaGraphManager.get_cudagraph_size", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "CudaGraphManager.capture_graph", "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "CudaGraphManager._capture_full_graph", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "CudaGraphManager._capture_piecewise_graph", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "CudaGraphManager.capture", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "CudaGraphManager.get_cudagraph_runtime_mode", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "CudaGraphManager.run_fullgraph", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "CudaGraphManager.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CudaGraphManager.scheduler_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CudaGraphManager.use_aux_hidden_state_outputs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CudaGraphManager.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CudaGraphManager.max_model_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CudaGraphManager.max_num_reqs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CudaGraphManager.max_num_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CudaGraphManager.dp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CudaGraphManager.uniform_decode_query_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CudaGraphManager.compilation_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CudaGraphManager.cudagraph_mode", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CudaGraphManager.graphs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CudaGraphManager.pool", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "CudaGraphManager.hidden_states", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "CudaGraphManager.aux_hidden_states", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 66, "n_typed": 53, "n_any": 0, "n_untyped": 13, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 42, "n_attrs": 15, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.worker.gpu.cudagraph_utils.get_cudagraph_sizes", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu.cudagraph_utils", "names": [ "vllm.v1.worker.gpu.cudagraph_utils.CudaGraphManager", "vllm.v1.worker.gpu.cudagraph_utils.capture_graphs", "vllm.v1.worker.gpu.cudagraph_utils.get_cudagraph_sizes", "vllm.v1.worker.gpu.cudagraph_utils.prepare_inputs_to_capture" ], "n_typable": 88, "n_typed": 74, "n_any": 0, "n_untyped": 14, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 19, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 42, "n_classes": 1, "n_attrs": 15, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu/dp_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.worker.gpu.dp_utils.make_num_tokens_across_dp", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.v1.worker.gpu.dp_utils.get_cudagraph_and_dp_padding", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.v1.worker.gpu.dp_utils.get_batch_metadata_across_dp", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu.dp_utils", "names": [ "vllm.v1.worker.gpu.dp_utils.get_batch_metadata_across_dp", "vllm.v1.worker.gpu.dp_utils.get_cudagraph_and_dp_padding", "vllm.v1.worker.gpu.dp_utils.make_num_tokens_across_dp" ], "n_typable": 15, "n_typed": 15, "n_any": 0, "n_untyped": 0, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 12, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu/input_batch.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.worker.gpu.input_batch.prepare_pos_seq_lens", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.v1.worker.gpu.input_batch.combine_sampled_and_draft_tokens", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "vllm.v1.worker.gpu.input_batch.post_update", "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "class", "name": "vllm.v1.worker.gpu.input_batch.InputBatch", "methods": [ { "kind": "function", "name": "InputBatch.make_dummy", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "InputBatch.req_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "InputBatch.num_reqs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "InputBatch.idx_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "InputBatch.idx_mapping_np", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "InputBatch.expanded_idx_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "InputBatch.expanded_local_pos", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "InputBatch.num_scheduled_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "InputBatch.num_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "InputBatch.num_tokens_after_padding", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "InputBatch.num_draft_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "InputBatch.query_start_loc", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "InputBatch.query_start_loc_np", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "InputBatch.seq_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "InputBatch.dcp_local_seq_lens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "InputBatch.input_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "InputBatch.positions", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "InputBatch.logits_indices", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "InputBatch.cu_num_logits", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "InputBatch.cu_num_logits_np", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "InputBatch.has_structured_output_reqs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 3, "n_attrs": 20, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.worker.gpu.input_batch.prepare_prefill_inputs", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "class", "name": "vllm.v1.worker.gpu.input_batch.InputBuffers", "methods": [ { "kind": "function", "name": "InputBuffers.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "InputBuffers.max_num_reqs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBuffers.max_num_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBuffers.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBuffers.input_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBuffers.positions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBuffers.query_start_loc", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBuffers.seq_lens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBuffers.dcp_local_seq_lens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 12, "n_typed": 3, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 3, "n_attrs": 8, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.worker.gpu.input_batch.get_num_sampled_and_rejected", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.v1.worker.gpu.input_batch.post_update_pool", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.v1.worker.gpu.input_batch.expand_idx_mapping", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu.input_batch", "names": [ "vllm.v1.worker.gpu.input_batch.InputBatch", "vllm.v1.worker.gpu.input_batch.InputBuffers", "vllm.v1.worker.gpu.input_batch.combine_sampled_and_draft_tokens", "vllm.v1.worker.gpu.input_batch.expand_idx_mapping", "vllm.v1.worker.gpu.input_batch.get_num_sampled_and_rejected", "vllm.v1.worker.gpu.input_batch.post_update", "vllm.v1.worker.gpu.input_batch.post_update_pool", "vllm.v1.worker.gpu.input_batch.prepare_pos_seq_lens", "vllm.v1.worker.gpu.input_batch.prepare_prefill_inputs" ], "n_typable": 66, "n_typed": 57, "n_any": 0, "n_untyped": 9, "n_functions": 7, "n_function_overloads": 7, "n_function_params": 43, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_classes": 2, "n_attrs": 28, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu/kv_connector.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.worker.gpu.kv_connector.KVConnector", "methods": [ { "kind": "function", "name": "KVConnector.pre_forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVConnector.post_forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "KVConnector.no_forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "KVConnector.set_disabled", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.worker.gpu.kv_connector.get_kv_connector", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.v1.worker.gpu.kv_connector.ActiveKVConnector", "methods": [ { "kind": "function", "name": "ActiveKVConnector.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ActiveKVConnector.pre_forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ActiveKVConnector.post_forward", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ActiveKVConnector.clear_metadata", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ActiveKVConnector.no_forward", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "ActiveKVConnector.set_disabled", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "ActiveKVConnector.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "ActiveKVConnector.kv_connector", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 16, "n_typed": 13, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 8, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.worker.gpu.kv_connector.NO_OP_KV_CONNECTOR", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu.kv_connector", "names": [ "vllm.v1.worker.gpu.kv_connector.ActiveKVConnector", "vllm.v1.worker.gpu.kv_connector.KVConnector", "vllm.v1.worker.gpu.kv_connector.NO_OP_KV_CONNECTOR", "vllm.v1.worker.gpu.kv_connector.get_kv_connector" ], "n_typable": 29, "n_typed": 25, "n_any": 0, "n_untyped": 4, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 13, "n_classes": 2, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu/lora_utils.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.v1.worker.gpu.lora_utils.NO_LORA_ID", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.v1.worker.gpu.lora_utils.LoraState", "methods": [ { "kind": "function", "name": "LoraState.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LoraState.add_request", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LoraState.remove_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LoraState.make_lora_inputs", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LoraState.lora_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LoraState.lora_requests", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 14, "n_typed": 12, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu.lora_utils", "names": [ "vllm.v1.worker.gpu.lora_utils.LoraState", "vllm.v1.worker.gpu.lora_utils.NO_LORA_ID" ], "n_typable": 14, "n_typed": 12, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_classes": 1, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu/metrics/logits.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.worker.gpu.metrics.logits.get_num_nans", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu.metrics.logits", "names": [ "vllm.v1.worker.gpu.metrics.logits.get_num_nans" ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu/mm/encoder_cache.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.worker.gpu.mm.encoder_cache.EncoderCache", "methods": [ { "kind": "function", "name": "EncoderCache.__init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EncoderCache.add_request", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EncoderCache.remove_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EncoderCache.reset_mm_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EncoderCache.reset_encoder_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EncoderCache.free_encoder_cache", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EncoderCache.mm_features", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EncoderCache.encoder_outputs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 12, "n_typed": 11, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 4, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu.mm.encoder_cache", "names": [ "vllm.v1.worker.gpu.mm.encoder_cache.EncoderCache" ], "n_typable": 12, "n_typed": 11, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 4, "n_classes": 1, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu/mm/encoder_runner.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.worker.gpu.mm.encoder_runner.EncoderRunner", "methods": [ { "kind": "function", "name": "EncoderRunner.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "EncoderRunner.prepare_mm_inputs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EncoderRunner.execute_mm_encoder", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EncoderRunner.gather_mm_embeddings", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "EncoderRunner.get_inputs_embeds", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EncoderRunner.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EncoderRunner.max_num_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EncoderRunner.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EncoderRunner.encoder_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EncoderRunner.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EncoderRunner.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EncoderRunner.inputs_embeds", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 29, "n_typed": 21, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 17, "n_attrs": 7, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu.mm.encoder_runner", "names": [ "vllm.v1.worker.gpu.mm.encoder_runner.EncoderRunner" ], "n_typable": 29, "n_typed": 21, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 17, "n_classes": 1, "n_attrs": 7, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu/mm/mrope_utils.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.worker.gpu.mm.mrope_utils.MRopeState", "methods": [ { "kind": "function", "name": "MRopeState.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MRopeState.init_prefill_mrope_positions", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "MRopeState.apply_staged_writes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "MRopeState.prepare_mrope_positions", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MRopeState.max_num_reqs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MRopeState.max_num_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MRopeState.max_model_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MRopeState.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MRopeState.prefill_mrope_positions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MRopeState.prefill_mrope_delta", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "MRopeState.mrope_positions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 23, "n_typed": 15, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 12, "n_attrs": 7, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu.mm.mrope_utils", "names": [ "vllm.v1.worker.gpu.mm.mrope_utils.MRopeState" ], "n_typable": 23, "n_typed": 15, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 12, "n_classes": 1, "n_attrs": 7, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu/model_runner.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.v1.worker.gpu.model_runner.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.worker.gpu.model_runner.GPUModelRunner", "methods": [ { "kind": "function", "name": "GPUModelRunner.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GPUModelRunner.update_max_model_len", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner.get_supported_tasks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPUModelRunner.load_model", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GPUModelRunner.get_model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPUModelRunner.get_kv_cache_spec", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPUModelRunner.initialize_kv_cache", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner._dummy_run", "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "GPUModelRunner._dummy_sampler_run", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner._dummy_pooler_run", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner.profile_run", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPUModelRunner.reset_mm_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPUModelRunner.reset_encoder_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPUModelRunner._get_num_input_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner.capture_model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPUModelRunner.warmup_for_prefill", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPUModelRunner.finish_requests", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner.free_states", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner.add_requests", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner.update_requests", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner.prepare_inputs", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GPUModelRunner.prepare_attn", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner.prepare_dummy_attn", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner.sample", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GPUModelRunner.postprocess", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GPUModelRunner.execute_model", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GPUModelRunner.sample_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner.take_draft_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPUModelRunner.pool", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPUModelRunner.postprocess_pool", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "GPUModelRunner.main_stream", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "GPUModelRunner.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.cache_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.compilation_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.lora_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.load_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.parallel_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.scheduler_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.speculative_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.observability_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.kv_cache_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.max_model_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.max_num_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.max_num_reqs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.use_async_scheduling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.output_copy_stream", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.output_copy_event", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.pp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.use_pp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.dcp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.use_dcp", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.dcp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.cp_interleave", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.mm_registry", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.supports_mm_inputs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.encoder_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.speculator", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.num_speculative_steps", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.use_aux_hidden_state_outputs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.draft_tokens_handler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.req_states", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.input_buffers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.sampler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.prompt_logprobs_worker", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.cudagraph_manager", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.structured_outputs_worker", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.lora_state", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.kv_connector", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.is_pooling_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.pooling_runner", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.execute_model_state", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.is_first_pp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.is_last_pp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 112, "n_typed": 63, "n_any": 0, "n_untyped": 49, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 30, "n_method_overloads": 30, "n_method_params": 35, "n_attrs": 46, "n_properties": 1 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu.model_runner", "names": [ "vllm.v1.worker.gpu.model_runner.GPUModelRunner", "vllm.v1.worker.gpu.model_runner.logger" ], "n_typable": 113, "n_typed": 63, "n_any": 0, "n_untyped": 50, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 30, "n_method_overloads": 30, "n_method_params": 35, "n_classes": 1, "n_attrs": 47, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu/model_states/__init__.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.worker.gpu.model_states.init_model_state", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu.model_states", "names": [ "vllm.v1.worker.gpu.model_states.init_model_state" ], "n_typable": 5, "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 4, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu/model_states/default.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.worker.gpu.model_states.default.DefaultModelState", "methods": [ { "kind": "function", "name": "DefaultModelState.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "DefaultModelState.add_request", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DefaultModelState.apply_staged_writes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "DefaultModelState.get_mm_embeddings", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "DefaultModelState.prepare_inputs", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DefaultModelState.prepare_dummy_inputs", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DefaultModelState.prepare_attn", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DefaultModelState.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DefaultModelState.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DefaultModelState.scheduler_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DefaultModelState.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DefaultModelState.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DefaultModelState.supports_mm_inputs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DefaultModelState.max_model_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DefaultModelState.max_num_reqs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DefaultModelState.max_num_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DefaultModelState.inputs_embeds_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DefaultModelState.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DefaultModelState.uses_mrope", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DefaultModelState.encoder_cache", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DefaultModelState.encoder_runner", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DefaultModelState.mrope_state", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 40, "n_typed": 24, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 18, "n_attrs": 15, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu.model_states.default", "names": [ "vllm.v1.worker.gpu.model_states.default.DefaultModelState" ], "n_typable": 40, "n_typed": 24, "n_any": 0, "n_untyped": 16, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 18, "n_classes": 1, "n_attrs": 15, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu/model_states/interface.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.worker.gpu.model_states.interface.ModelState", "methods": [ { "kind": "function", "name": "ModelState.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "ModelState.add_request", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ModelState.apply_staged_writes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ModelState.get_mm_embeddings", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "ModelState.prepare_inputs", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ModelState.prepare_dummy_inputs", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "ModelState.prepare_attn", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [], "n_typable": 25, "n_typed": 25, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 18, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu.model_states.interface", "names": [ "vllm.v1.worker.gpu.model_states.interface.ModelState" ], "n_typable": 25, "n_typed": 25, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 18, "n_classes": 1, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu/pool/pooling_runner.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.worker.gpu.pool.pooling_runner.PoolingRunner", "methods": [ { "kind": "function", "name": "PoolingRunner.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PoolingRunner.get_supported_pooling_tasks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PoolingRunner.pool", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "PoolingRunner.dummy_pooler_run", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PoolingRunner.model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 10, "n_typed": 8, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 5, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu.pool.pooling_runner", "names": [ "vllm.v1.worker.gpu.pool.pooling_runner.PoolingRunner" ], "n_typable": 10, "n_typed": 8, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 5, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu/pp_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.worker.gpu.pp_utils.pp_broadcast", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.v1.worker.gpu.pp_utils.pp_receive", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu.pp_utils", "names": [ "vllm.v1.worker.gpu.pp_utils.pp_broadcast", "vllm.v1.worker.gpu.pp_utils.pp_receive" ], "n_typable": 7, "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 5, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu/sample/bad_words.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.worker.gpu.sample.bad_words.BadWordsState", "methods": [ { "kind": "function", "name": "BadWordsState.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "BadWordsState.add_request", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BadWordsState.apply_staged_writes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "BadWordsState.apply_bad_words", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BadWordsState.req_states", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BadWordsState.max_num_reqs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BadWordsState.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BadWordsState.bad_word_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BadWordsState.bad_word_offsets", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BadWordsState.num_bad_words", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 18, "n_typed": 11, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_attrs": 6, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.worker.gpu.sample.bad_words.MAX_NUM_BAD_WORDS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.v1.worker.gpu.sample.bad_words.MAX_BAD_WORDS_TOTAL_TOKENS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.v1.worker.gpu.sample.bad_words.apply_bad_words", "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu.sample.bad_words", "names": [ "vllm.v1.worker.gpu.sample.bad_words.BadWordsState", "vllm.v1.worker.gpu.sample.bad_words.MAX_BAD_WORDS_TOTAL_TOKENS", "vllm.v1.worker.gpu.sample.bad_words.MAX_NUM_BAD_WORDS", "vllm.v1.worker.gpu.sample.bad_words.apply_bad_words" ], "n_typable": 30, "n_typed": 23, "n_any": 0, "n_untyped": 7, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 11, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 8, "n_classes": 1, "n_attrs": 8, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu/sample/gumbel.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.worker.gpu.sample.gumbel.gumbel_sample", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.v1.worker.gpu.sample.gumbel.apply_temperature", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu.sample.gumbel", "names": [ "vllm.v1.worker.gpu.sample.gumbel.apply_temperature", "vllm.v1.worker.gpu.sample.gumbel.gumbel_sample" ], "n_typable": 11, "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 9, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu/sample/logit_bias.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.v1.worker.gpu.sample.logit_bias.MAX_NUM_STOP_TOKEN_IDS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.v1.worker.gpu.sample.logit_bias.MAX_NUM_ALLOWED_TOKEN_IDS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.v1.worker.gpu.sample.logit_bias.LogitBiasState", "methods": [ { "kind": "function", "name": "LogitBiasState.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LogitBiasState.add_request", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LogitBiasState.apply_staged_writes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LogitBiasState.apply_logit_bias", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "LogitBiasState.max_num_reqs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LogitBiasState.num_allowed_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LogitBiasState.allowed_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LogitBiasState.num_logit_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LogitBiasState.logit_bias_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LogitBiasState.logit_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LogitBiasState.min_lens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LogitBiasState.num_stop_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LogitBiasState.stop_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "LogitBiasState.use_logit_bias", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 23, "n_typed": 12, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 9, "n_attrs": 10, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.worker.gpu.sample.logit_bias.MAX_NUM_LOGIT_BIAS_TOKENS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.v1.worker.gpu.sample.logit_bias.apply_logit_bias", "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu.sample.logit_bias", "names": [ "vllm.v1.worker.gpu.sample.logit_bias.LogitBiasState", "vllm.v1.worker.gpu.sample.logit_bias.MAX_NUM_ALLOWED_TOKEN_IDS", "vllm.v1.worker.gpu.sample.logit_bias.MAX_NUM_LOGIT_BIAS_TOKENS", "vllm.v1.worker.gpu.sample.logit_bias.MAX_NUM_STOP_TOKEN_IDS", "vllm.v1.worker.gpu.sample.logit_bias.apply_logit_bias" ], "n_typable": 35, "n_typed": 24, "n_any": 0, "n_untyped": 11, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 11, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 9, "n_classes": 1, "n_attrs": 13, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu/sample/logprob.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.worker.gpu.sample.logprob.compute_topk_logprobs", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.v1.worker.gpu.sample.logprob.compute_token_logprobs", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu.sample.logprob", "names": [ "vllm.v1.worker.gpu.sample.logprob.compute_token_logprobs", "vllm.v1.worker.gpu.sample.logprob.compute_topk_logprobs" ], "n_typable": 8, "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 6, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu/sample/min_p.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.worker.gpu.sample.min_p.apply_min_p", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu.sample.min_p", "names": [ "vllm.v1.worker.gpu.sample.min_p.apply_min_p" ], "n_typable": 4, "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 3, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu/sample/output.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.worker.gpu.sample.output.SamplerOutput", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "SamplerOutput.sampled_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SamplerOutput.logprobs_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SamplerOutput.num_nans", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu.sample.output", "names": [ "vllm.v1.worker.gpu.sample.output.SamplerOutput" ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 1, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu/sample/penalties.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.worker.gpu.sample.penalties.apply_penalties", "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "vllm.v1.worker.gpu.sample.penalties.use_penalty", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.v1.worker.gpu.sample.penalties.PenaltiesState", "methods": [ { "kind": "function", "name": "PenaltiesState.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PenaltiesState.add_request", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PenaltiesState.apply_staged_writes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PenaltiesState.apply_penalties", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PenaltiesState.req_states", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PenaltiesState.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PenaltiesState.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PenaltiesState.repetition_penalty", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PenaltiesState.frequency_penalty", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PenaltiesState.presence_penalty", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PenaltiesState.use_penalty", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PenaltiesState.prompt_bin_mask", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PenaltiesState.output_bin_counts", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 22, "n_typed": 12, "n_any": 0, "n_untyped": 10, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 9, "n_attrs": 9, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.worker.gpu.sample.penalties.bincount", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu.sample.penalties", "names": [ "vllm.v1.worker.gpu.sample.penalties.PenaltiesState", "vllm.v1.worker.gpu.sample.penalties.apply_penalties", "vllm.v1.worker.gpu.sample.penalties.bincount", "vllm.v1.worker.gpu.sample.penalties.use_penalty" ], "n_typable": 43, "n_typed": 33, "n_any": 0, "n_untyped": 10, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 18, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 9, "n_classes": 1, "n_attrs": 9, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu/sample/prompt_logprob.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.worker.gpu.sample.prompt_logprob.compute_prompt_logprobs_with_chunking", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.v1.worker.gpu.sample.prompt_logprob.get_prompt_logprobs_token_ids", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "class", "name": "vllm.v1.worker.gpu.sample.prompt_logprob.PromptLogprobsWorker", "methods": [ { "kind": "function", "name": "PromptLogprobsWorker.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PromptLogprobsWorker.add_request", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "PromptLogprobsWorker.remove_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PromptLogprobsWorker.compute_prompt_logprobs", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PromptLogprobsWorker.max_num_reqs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PromptLogprobsWorker.uses_prompt_logprobs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PromptLogprobsWorker.in_progress_prompt_logprobs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 20, "n_typed": 16, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 13, "n_attrs": 3, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu.sample.prompt_logprob", "names": [ "vllm.v1.worker.gpu.sample.prompt_logprob.PromptLogprobsWorker", "vllm.v1.worker.gpu.sample.prompt_logprob.compute_prompt_logprobs_with_chunking", "vllm.v1.worker.gpu.sample.prompt_logprob.get_prompt_logprobs_token_ids" ], "n_typable": 30, "n_typed": 26, "n_any": 0, "n_untyped": 4, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 8, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 13, "n_classes": 1, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu/sample/sampler.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.worker.gpu.sample.sampler.Sampler", "methods": [ { "kind": "function", "name": "Sampler.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "Sampler.add_request", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Sampler.apply_staged_writes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Sampler.__call__", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "Sampler.sample", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Sampler.logprobs_mode", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Sampler.compute_nans", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Sampler.sampling_states", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Sampler.penalties_state", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Sampler.logit_bias_state", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Sampler.bad_words_state", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Sampler.num_speculative_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 34, "n_typed": 26, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 22, "n_attrs": 7, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu.sample.sampler", "names": [ "vllm.v1.worker.gpu.sample.sampler.Sampler" ], "n_typable": 34, "n_typed": 26, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 22, "n_classes": 1, "n_attrs": 7, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu/sample/states.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.v1.worker.gpu.sample.states.NO_LOGPROBS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.v1.worker.gpu.sample.states.SamplingStates", "methods": [ { "kind": "function", "name": "SamplingStates.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SamplingStates.add_request", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SamplingStates.apply_staged_writes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SamplingStates.apply_temperature", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SamplingStates.apply_min_p", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SamplingStates.apply_top_k_top_p", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SamplingStates.max_num_logprobs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SamplingStates.max_num_reqs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SamplingStates.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SamplingStates.temperature", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SamplingStates.top_k", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SamplingStates.top_p", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SamplingStates.min_p", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SamplingStates.seeds", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SamplingStates.num_logprobs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 29, "n_typed": 20, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 14, "n_attrs": 8, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu.sample.states", "names": [ "vllm.v1.worker.gpu.sample.states.NO_LOGPROBS", "vllm.v1.worker.gpu.sample.states.SamplingStates" ], "n_typable": 29, "n_typed": 20, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 14, "n_classes": 1, "n_attrs": 9, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu/spec_decode/__init__.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.worker.gpu.spec_decode.init_speculator", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu.spec_decode", "names": [ "vllm.v1.worker.gpu.spec_decode.init_speculator" ], "n_typable": 3, "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu/spec_decode/eagle/cudagraph.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.worker.gpu.spec_decode.eagle.cudagraph.EagleCudaGraphManager", "methods": [ { "kind": "function", "name": "EagleCudaGraphManager.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EagleCudaGraphManager.get_cudagraph_size", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EagleCudaGraphManager.get_cudagraph_runtime_mode", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EagleCudaGraphManager.capture_graph", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "EagleCudaGraphManager._capture_full_graph", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "EagleCudaGraphManager._capture_piecewise_graph", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "EagleCudaGraphManager.capture", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "EagleCudaGraphManager.run_fullgraph", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EagleCudaGraphManager.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleCudaGraphManager.scheduler_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleCudaGraphManager.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleCudaGraphManager.max_model_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleCudaGraphManager.max_num_reqs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleCudaGraphManager.max_num_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleCudaGraphManager.dp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleCudaGraphManager.compilation_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleCudaGraphManager.cudagraph_mode", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleCudaGraphManager.graphs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "EagleCudaGraphManager.pool", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 50, "n_typed": 39, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 31, "n_attrs": 11, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu.spec_decode.eagle.cudagraph", "names": [ "vllm.v1.worker.gpu.spec_decode.eagle.cudagraph.EagleCudaGraphManager" ], "n_typable": 50, "n_typed": 39, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 8, "n_method_overloads": 8, "n_method_params": 31, "n_classes": 1, "n_attrs": 11, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu/spec_decode/eagle/eagle3_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.worker.gpu.spec_decode.eagle.eagle3_utils.get_eagle3_aux_layers_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.v1.worker.gpu.spec_decode.eagle.eagle3_utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.v1.worker.gpu.spec_decode.eagle.eagle3_utils.set_eagle3_aux_hidden_state_layers", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu.spec_decode.eagle.eagle3_utils", "names": [ "vllm.v1.worker.gpu.spec_decode.eagle.eagle3_utils.get_eagle3_aux_layers_from_config", "vllm.v1.worker.gpu.spec_decode.eagle.eagle3_utils.logger", "vllm.v1.worker.gpu.spec_decode.eagle.eagle3_utils.set_eagle3_aux_hidden_state_layers" ], "n_typable": 6, "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_functions": 2, "n_function_overloads": 2, "n_function_params": 3, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu/spec_decode/eagle/speculator.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.worker.gpu.spec_decode.eagle.speculator.prepare_eagle_decode", "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "vllm.v1.worker.gpu.spec_decode.eagle.speculator.update_eagle_inputs", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "class", "name": "vllm.v1.worker.gpu.spec_decode.eagle.speculator.EagleSpeculator", "methods": [ { "kind": "function", "name": "EagleSpeculator.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "EagleSpeculator.load_model", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "EagleSpeculator.set_attn", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "EagleSpeculator.run_model", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "EagleSpeculator.generate_draft", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "EagleSpeculator.capture_model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "EagleSpeculator.propose", "n_typed": 15, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 15, "n_params": 14, "n_function_overloads": 1, "n_function_params": 14 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EagleSpeculator.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleSpeculator.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleSpeculator.speculative_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleSpeculator.method", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleSpeculator.num_speculative_steps", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleSpeculator.draft_model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleSpeculator.scheduler_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleSpeculator.max_num_reqs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleSpeculator.max_num_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleSpeculator.max_model_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleSpeculator.hidden_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleSpeculator.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleSpeculator.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleSpeculator.dp_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleSpeculator.dp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleSpeculator.input_buffers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleSpeculator.hidden_states", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleSpeculator.idx_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleSpeculator.temperature", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleSpeculator.seeds", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleSpeculator.draft_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "EagleSpeculator.cudagraph_manager", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 61, "n_typed": 38, "n_any": 0, "n_untyped": 23, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 32, "n_attrs": 22, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.worker.gpu.spec_decode.eagle.speculator.prepare_eagle_inputs", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "attr", "name": "vllm.v1.worker.gpu.spec_decode.eagle.speculator.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu.spec_decode.eagle.speculator", "names": [ "vllm.v1.worker.gpu.spec_decode.eagle.speculator.EagleSpeculator", "vllm.v1.worker.gpu.spec_decode.eagle.speculator.logger", "vllm.v1.worker.gpu.spec_decode.eagle.speculator.prepare_eagle_decode", "vllm.v1.worker.gpu.spec_decode.eagle.speculator.prepare_eagle_inputs", "vllm.v1.worker.gpu.spec_decode.eagle.speculator.update_eagle_inputs" ], "n_typable": 85, "n_typed": 59, "n_any": 0, "n_untyped": 26, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 20, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 32, "n_classes": 1, "n_attrs": 23, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu/spec_decode/eagle/utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.worker.gpu.spec_decode.eagle.utils.load_eagle_model", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu.spec_decode.eagle.utils", "names": [ "vllm.v1.worker.gpu.spec_decode.eagle.utils.load_eagle_model" ], "n_typable": 3, "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu/spec_decode/rejection_sample.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.worker.gpu.spec_decode.rejection_sample.rejection_sample", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu.spec_decode.rejection_sample", "names": [ "vllm.v1.worker.gpu.spec_decode.rejection_sample.rejection_sample" ], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 4, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu/spec_decode/utils.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.worker.gpu.spec_decode.utils.DraftTokensHandler", "methods": [ { "kind": "function", "name": "DraftTokensHandler.__init__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "DraftTokensHandler.set_draft_tokens", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "DraftTokensHandler.get_draft_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "DraftTokensHandler.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DraftTokensHandler.copy_stream", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DraftTokensHandler.copy_event", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "DraftTokensHandler.req_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DraftTokensHandler.draft_tokens_np", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "DraftTokensHandler.num_draft_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 12, "n_typed": 8, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu.spec_decode.utils", "names": [ "vllm.v1.worker.gpu.spec_decode.utils.DraftTokensHandler" ], "n_typable": 12, "n_typed": 8, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 3, "n_classes": 1, "n_attrs": 6, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu/states.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.worker.gpu.states.RequestState", "methods": [ { "kind": "function", "name": "RequestState.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "RequestState.add_request", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "RequestState.apply_staged_writes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "RequestState.remove_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "RequestState.any_prefills", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "RequestState.num_reqs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "RequestState.max_num_reqs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.max_model_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.max_num_batched_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.num_speculative_steps", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.req_id_to_index", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.index_to_req_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.free_indices", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.all_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.prompt_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.prefill_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.total_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.num_computed_prefill_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.num_computed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.last_sampled_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.draft_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "RequestState.next_prefill_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 36, "n_typed": 19, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 12, "n_attrs": 18, "n_properties": 1 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu.states", "names": [ "vllm.v1.worker.gpu.states.RequestState" ], "n_typable": 36, "n_typed": 19, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 12, "n_classes": 1, "n_attrs": 18, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu/structured_outputs.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.worker.gpu.structured_outputs.StructuredOutputsWorker", "methods": [ { "kind": "function", "name": "StructuredOutputsWorker.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "StructuredOutputsWorker.apply_grammar_bitmask", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "StructuredOutputsWorker.logits_indices", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StructuredOutputsWorker.grammar_bitmask", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StructuredOutputsWorker.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "StructuredOutputsWorker.copy_stream", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 8, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 4, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu.structured_outputs", "names": [ "vllm.v1.worker.gpu.structured_outputs.StructuredOutputsWorker" ], "n_typable": 13, "n_typed": 8, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_classes": 1, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu/warmup.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.worker.gpu.warmup.warmup_kernels", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu.warmup", "names": [ "vllm.v1.worker.gpu.warmup.warmup_kernels" ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu_input_batch.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.worker.gpu_input_batch.CachedRequestState", "methods": [ { "kind": "function", "name": "CachedRequestState.__post_init__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "CachedRequestState.get_token_id", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "CachedRequestState.num_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "CachedRequestState.req_id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CachedRequestState.prompt_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CachedRequestState.mm_features", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CachedRequestState.sampling_params", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CachedRequestState.generator", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CachedRequestState.block_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CachedRequestState.num_computed_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CachedRequestState.output_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CachedRequestState.mrope_positions", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CachedRequestState.mrope_position_delta", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CachedRequestState.xdrope_positions", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CachedRequestState.lora_request", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CachedRequestState.prompt_embeds", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CachedRequestState.prev_num_draft_len", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CachedRequestState.pooling_params", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CachedRequestState.pooling_states", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 4, "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 16, "n_properties": 1 }, { "kind": "class", "name": "vllm.v1.worker.gpu_input_batch.InputBatch", "methods": [ { "kind": "function", "name": "InputBatch.__init__", "n_typed": 14, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 15, "n_params": 14, "n_function_overloads": 1, "n_function_params": 14 }, { "kind": "function", "name": "InputBatch._register_add_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InputBatch.add_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InputBatch.update_req_spec_token_ids", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InputBatch.remove_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InputBatch.swap_states", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InputBatch.condense", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "InputBatch.refresh_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "InputBatch._make_sampling_metadata", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "InputBatch.get_pooling_params", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "InputBatch.get_pooling_states", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "InputBatch.get_pooling_metadata", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "InputBatch._make_prompt_token_ids_tensor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "InputBatch.make_lora_inputs", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InputBatch.set_async_sampled_token_ids", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InputBatch.update_async_output_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "InputBatch.update_async_spec_token_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "InputBatch.req_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "InputBatch.num_reqs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "InputBatch.all_greedy", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "InputBatch.all_random", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "InputBatch.no_top_p", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "InputBatch.no_top_k", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "InputBatch.no_penalties", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "InputBatch.max_num_logprobs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "InputBatch.no_allowed_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "InputBatch.is_pooling_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.is_spec_decode", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.max_num_reqs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.max_model_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.max_num_batched_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.pin_memory", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.req_id_to_index", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.token_ids_cpu_tensor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.token_ids_cpu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.is_token_ids_tensor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.is_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.req_prompt_embeds", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.num_tokens_no_spec", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.num_prompt_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.num_computed_tokens_cpu_tensor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.num_computed_tokens_cpu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.block_table", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.temperature", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.temperature_cpu_tensor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.temperature_cpu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.greedy_reqs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.random_reqs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.top_p", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.top_p_cpu_tensor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.top_p_cpu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.top_p_reqs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.top_k", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.top_k_cpu_tensor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.top_k_cpu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.top_k_reqs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.frequency_penalties", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.frequency_penalties_cpu_tensor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.frequency_penalties_cpu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.frequency_penalties_reqs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.presence_penalties", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.presence_penalties_cpu_tensor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.presence_penalties_cpu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.presence_penalties_reqs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.repetition_penalties", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.repetition_penalties_cpu_tensor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.repetition_penalties_cpu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.repetition_penalties_reqs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.num_accepted_tokens_cpu_tensor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.num_accepted_tokens_cpu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.request_lora_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.lora_id_to_request_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.lora_id_to_lora_request", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.generators", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.num_logprobs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.in_progress_prompt_logprobs_cpu", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.batch_update_builder", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.has_allowed_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.allowed_token_ids_mask", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.allowed_token_ids_mask_cpu_tensor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.bad_words_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.logits_processing_needs_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.req_output_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.logitsprocs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.logitsprocs_need_output_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.spec_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.sampling_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.pooling_params", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.pooling_states", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.prev_sampled_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.prev_req_id_to_index", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.sampled_token_ids_cpu", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.async_copy_ready_event", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 121, "n_typed": 76, "n_any": 0, "n_untyped": 45, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 17, "n_method_overloads": 17, "n_method_params": 26, "n_attrs": 69, "n_properties": 9 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu_input_batch", "names": [ "vllm.v1.worker.gpu_input_batch.CachedRequestState", "vllm.v1.worker.gpu_input_batch.InputBatch" ], "n_typable": 125, "n_typed": 79, "n_any": 0, "n_untyped": 46, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 19, "n_method_overloads": 19, "n_method_params": 27, "n_classes": 2, "n_attrs": 85, "n_properties": 10, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu_model_runner.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.worker.gpu_model_runner.AsyncGPUPoolingModelRunnerOutput", "methods": [ { "kind": "function", "name": "AsyncGPUPoolingModelRunnerOutput.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "AsyncGPUPoolingModelRunnerOutput.get_output", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AsyncGPUPoolingModelRunnerOutput.async_copy_ready_event", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 7, "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 4, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.worker.gpu_model_runner.EncoderTimingStats", "methods": [ { "kind": "function", "name": "EncoderTimingStats.to_dict", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "EncoderTimingStats.encoder_forward_secs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "EncoderTimingStats.num_encoder_calls", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 1, "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.worker.gpu_model_runner.AttnMetadataDict", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.worker.gpu_model_runner.ExecuteModelState", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ExecuteModelState.scheduler_output", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ExecuteModelState.logits", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ExecuteModelState.spec_decode_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ExecuteModelState.spec_decode_common_attn_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ExecuteModelState.hidden_states", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ExecuteModelState.sample_hidden_states", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ExecuteModelState.aux_hidden_states", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ExecuteModelState.ec_connector_output", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ExecuteModelState.cudagraph_stats", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ExecuteModelState.slot_mappings", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 10, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.worker.gpu_model_runner.PerLayerAttnMetadata", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.worker.gpu_model_runner.AsyncGPUModelRunnerOutput", "methods": [ { "kind": "function", "name": "AsyncGPUModelRunnerOutput.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "AsyncGPUModelRunnerOutput.get_output", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AsyncGPUModelRunnerOutput.async_copy_ready_event", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AsyncGPUModelRunnerOutput.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "AsyncGPUModelRunnerOutput.sampled_token_ids_cpu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 11, "n_typed": 7, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 3, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.worker.gpu_model_runner.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.worker.gpu_model_runner.GPUModelRunner", "methods": [ { "kind": "function", "name": "GPUModelRunner.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GPUModelRunner.update_max_model_len", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner.reset_mm_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPUModelRunner.reset_encoder_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPUModelRunner.init_fp8_kv_scales", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPUModelRunner._get_positions", "n_typed": 0, "n_any": 1, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner._make_buffer", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GPUModelRunner._get_mamba_copy_bufs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPUModelRunner._init_model_kwargs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPUModelRunner._may_reorder_batch", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner._init_kv_zero_meta", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPUModelRunner._zero_block_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner._init_device_properties", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPUModelRunner._sync_device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPUModelRunner._update_states", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner._update_states_after_model_execute", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GPUModelRunner._update_streaming_request", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GPUModelRunner._init_mrope_positions", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner._init_xdrope_positions", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner._extract_mm_kwargs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner._dummy_mm_kwargs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner._get_cumsum_and_arange", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GPUModelRunner._prepare_input_ids", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GPUModelRunner._get_encoder_seq_lens", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GPUModelRunner._prepare_inputs", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GPUModelRunner._build_attention_metadata", "n_typed": 13, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 }, { "kind": "function", "name": "GPUModelRunner._compute_cascade_attn_prefix_lens", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GPUModelRunner._compute_cascade_attn_prefix_len", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "GPUModelRunner._calc_mrope_positions", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner._calc_xdrope_positions", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner._calc_spec_decode_metadata", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GPUModelRunner._prepare_kv_sharing_fast_prefill", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner._batch_mm_inputs_from_scheduler", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner._execute_mm_encoder", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner._gather_mm_embeddings", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GPUModelRunner.get_model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPUModelRunner.get_supported_generation_tasks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPUModelRunner.get_supported_pooling_tasks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPUModelRunner.get_supported_tasks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPUModelRunner.sync_and_slice_intermediate_tensors", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GPUModelRunner.eplb_step", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GPUModelRunner.setup_eplb_from_mapping", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GPUModelRunner._pool", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GPUModelRunner._pad_for_sequence_parallelism", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner._prepare_mm_inputs", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner._preprocess", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GPUModelRunner._sample", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GPUModelRunner._bookkeeping_sync", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "GPUModelRunner.synchronize_input_prep", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPUModelRunner._model_forward", "n_typed": 5, "n_any": 1, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "GPUModelRunner._is_uniform_decode", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "GPUModelRunner._determine_batch_execution_and_padding", "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "GPUModelRunner._register_layerwise_nvtx_hooks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPUModelRunner._get_slot_mappings", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "GPUModelRunner.execute_model", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GPUModelRunner.sample_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner._pp_broadcast_prev_sampled_token_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner._pp_receive_prev_sampled_token_ids_to_input_batch", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPUModelRunner.take_draft_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPUModelRunner._copy_draft_token_ids_to_cpu", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GPUModelRunner._get_draft_token_ids_cpu", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPUModelRunner._copy_valid_sampled_token_count", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GPUModelRunner._get_valid_sampled_token_count", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPUModelRunner.propose_draft_token_ids", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "GPUModelRunner.update_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner.load_model", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner._get_eagle3_aux_layers_from_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPUModelRunner.reload_weights", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GPUModelRunner._get_prompt_logprobs_dict", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GPUModelRunner._get_nans_in_logits", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner.maybe_randomize_inputs", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GPUModelRunner._get_mm_dummy_batch", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GPUModelRunner._dummy_run", "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "GPUModelRunner._dummy_sampler_run", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner._dummy_pooler_run_task", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GPUModelRunner._dummy_pooler_run", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner.profile_run", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPUModelRunner.capture_model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPUModelRunner._capture_cudagraphs", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GPUModelRunner.initialize_attn_backend", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner.initialize_metadata_builders", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GPUModelRunner._check_and_update_cudagraph_mode", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GPUModelRunner.calculate_reorder_batch_threshold", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPUModelRunner.may_reinitialize_input_batch", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GPUModelRunner._allocate_kv_cache_tensors", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner._attn_group_iterator", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPUModelRunner._kv_cache_spec_attn_group_iterator", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPUModelRunner._reshape_kv_cache_tensors", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "GPUModelRunner._update_hybrid_attention_mamba_layout", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner.initialize_kv_cache_tensors", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "GPUModelRunner.maybe_add_kv_sharing_layers_to_kv_cache_groups", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner.initialize_kv_cache", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner.init_routed_experts_capturer", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPUModelRunner._bind_routed_experts_capturer", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner.may_add_encoder_only_layers_to_kv_cache_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPUModelRunner.get_kv_cache_spec", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPUModelRunner._to_list", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "GPUModelRunner.get_encoder_timing_stats", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "GPUModelRunner.timed_encoder_operation", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "GPUModelRunner.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.cache_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.offload_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.compilation_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.lora_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.load_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.parallel_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.scheduler_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.speculative_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.observability_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.pin_memory", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.kv_cache_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.is_pooling_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.enable_prompt_embeds", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.is_multimodal_raw_input_only_model", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.is_multimodal_pruning_enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.max_model_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.calculate_kv_scales", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.dcp_world_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.dcp_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.max_num_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.max_num_reqs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.broadcast_pp_output", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.num_query_heads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.inputs_embeds_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.attention_chunk_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.use_alibi", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.cascade_attn_enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.is_mm_prefix_lm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.mm_registry", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.uses_mrope", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.uses_xdrope_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.supports_mm_inputs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.use_async_scheduling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.sampler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.eplb_state", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.eep_eplb_suppressed", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.kv_caches", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.cross_layers_kv_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.cross_layers_attn_backend", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.attn_groups", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.encoder_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.use_aux_hidden_state_outputs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.num_spec_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.requests", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.num_prompt_logprobs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.comm_stream", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.input_batch", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.async_output_copy_stream", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.prepare_inputs_event", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.encoder_timing_registry", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.input_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.positions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.query_start_loc", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.seq_lens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.encoder_seq_lens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.inputs_embeds", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.is_token_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.discard_request_mask", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.num_decode_draft_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.num_accepted_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.intermediate_tensors", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.arange_np", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.shared_kv_cache_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.kv_sharing_fast_prefill_eligible_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.kv_sharing_fast_prefill_logits_indices", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.uniform_decode_query_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.cudagraph_dispatcher", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.mm_budget", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.reorder_batch_threshold", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.runner_only_attn_layers", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.transfer_event", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.sampled_token_ids_pinned_cpu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.valid_sampled_token_count_event", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.valid_sampled_token_count_copy_stream", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.draft_token_ids_event", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.draft_token_ids_copy_stream", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.valid_sampled_token_count_cpu", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.draft_token_ids_cpu", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.execute_model_state", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.kv_connector_output", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.mamba_state_idx", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.layerwise_nvtx_hooks_registered", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.max_encoder_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.drafter", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.rejection_sampler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.dcp_local_seq_lens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.is_mm_embed_buffers", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.is_mm_embed_idx", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.mrope_positions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.xdrope_positions", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "GPUModelRunner.effective_drafter_max_model_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 369, "n_typed": 286, "n_any": 2, "n_untyped": 81, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 99, "n_method_overloads": 99, "n_method_params": 175, "n_attrs": 95, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu_model_runner", "names": [ "vllm.v1.worker.gpu_model_runner.AsyncGPUModelRunnerOutput", "vllm.v1.worker.gpu_model_runner.AsyncGPUPoolingModelRunnerOutput", "vllm.v1.worker.gpu_model_runner.AttnMetadataDict", "vllm.v1.worker.gpu_model_runner.EncoderTimingStats", "vllm.v1.worker.gpu_model_runner.ExecuteModelState", "vllm.v1.worker.gpu_model_runner.GPUModelRunner", "vllm.v1.worker.gpu_model_runner.PerLayerAttnMetadata", "vllm.v1.worker.gpu_model_runner.logger" ], "n_typable": 391, "n_typed": 301, "n_any": 2, "n_untyped": 88, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 104, "n_method_overloads": 104, "n_method_params": 185, "n_classes": 5, "n_attrs": 114, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu_ubatch_wrapper.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.worker.gpu_ubatch_wrapper.CUDAGraphMetaData", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "CUDAGraphMetaData.cudagraph", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CUDAGraphMetaData.ubatch_metadata", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CUDAGraphMetaData.outputs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.worker.gpu_ubatch_wrapper.UBatchWrapper", "methods": [ { "kind": "function", "name": "UBatchWrapper.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "UBatchWrapper._create_sm_control_context", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "UBatchWrapper.__getattr__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "UBatchWrapper.unwrap", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "UBatchWrapper._capture_ubatches", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "UBatchWrapper._run_ubatches", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "UBatchWrapper._make_ubatch_metadata", "n_typed": 1, "n_any": 0, "n_untyped": 11, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "UBatchWrapper._slice_model_inputs", "n_typed": 1, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "UBatchWrapper.__call__", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "UBatchWrapper.runnable", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UBatchWrapper.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UBatchWrapper.compilation_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UBatchWrapper.comm_stream", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UBatchWrapper.ready_barrier", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UBatchWrapper.cudagraphs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "UBatchWrapper.cudagraph_wrapper", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UBatchWrapper.graph_pool", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UBatchWrapper.sm_control", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UBatchWrapper.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 47, "n_typed": 12, "n_any": 0, "n_untyped": 35, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 28, "n_attrs": 10, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.worker.gpu_ubatch_wrapper.UbatchMetadata", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "UbatchMetadata.context", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "UbatchMetadata.input_ids", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "UbatchMetadata.positions", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "UbatchMetadata.inputs_embeds", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "UbatchMetadata.intermediate_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "UbatchMetadata.num_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 6, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.worker.gpu_ubatch_wrapper.SMControlContextManager", "methods": [ { "kind": "function", "name": "SMControlContextManager.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SMControlContextManager.__enter__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SMControlContextManager.__exit__", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SMControlContextManager.total_sms", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SMControlContextManager.compute_sms", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SMControlContextManager.comm_sms", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SMControlContextManager.set_comm_sms", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "SMControlContextManager.set_compute_sms", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 14, "n_typed": 3, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 6, "n_attrs": 5, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.worker.gpu_ubatch_wrapper.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu_ubatch_wrapper", "names": [ "vllm.v1.worker.gpu_ubatch_wrapper.CUDAGraphMetaData", "vllm.v1.worker.gpu_ubatch_wrapper.SMControlContextManager", "vllm.v1.worker.gpu_ubatch_wrapper.UBatchWrapper", "vllm.v1.worker.gpu_ubatch_wrapper.UbatchMetadata", "vllm.v1.worker.gpu_ubatch_wrapper.logger" ], "n_typable": 62, "n_typed": 15, "n_any": 0, "n_untyped": 47, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 34, "n_classes": 4, "n_attrs": 25, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/gpu_worker.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.worker.gpu_worker.init_worker_distributed_environment", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "class", "name": "vllm.v1.worker.gpu_worker.AsyncIntermediateTensors", "methods": [ { "kind": "function", "name": "AsyncIntermediateTensors.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "AsyncIntermediateTensors.wait_for_comm", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "AsyncIntermediateTensors.__getattribute__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 4, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.worker.gpu_worker.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.worker.gpu_worker.Worker", "methods": [ { "kind": "function", "name": "Worker.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "Worker.sleep", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Worker.wake_up", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Worker._maybe_get_memory_pool_context", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Worker.initialize_cache", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Worker.init_device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Worker.load_model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Worker.update_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Worker.reload_weights", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Worker.determine_available_memory", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Worker.get_kv_connector_handshake_metadata", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Worker.get_kv_cache_spec", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Worker.update_max_model_len", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Worker.initialize_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Worker.compile_or_warm_up_model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Worker.reset_mm_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Worker.reset_encoder_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Worker.get_model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Worker.get_supported_tasks", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Worker.get_encoder_timing_stats", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Worker.annotate_profile", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Worker.sample_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Worker.execute_model", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Worker.take_draft_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Worker.profile", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Worker.execute_dummy_batch", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Worker.add_lora", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Worker.remove_lora", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Worker.list_loras", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Worker.pin_lora", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Worker.check_health", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Worker.save_sharded_state", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Worker.save_tensorized_model", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Worker.init_weight_transfer_engine", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Worker.update_weights", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "Worker.shutdown", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Worker.elastic_ep_execute", "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Worker.elastic_ep_executor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Worker.weight_transfer_engine", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Worker.profiler", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "Worker.profiler_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "Worker.use_v2_model_runner", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 74, "n_typed": 60, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 37, "n_method_overloads": 37, "n_method_params": 32, "n_attrs": 5, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.worker.gpu_worker", "names": [ "vllm.v1.worker.gpu_worker.AsyncIntermediateTensors", "vllm.v1.worker.gpu_worker.Worker", "vllm.v1.worker.gpu_worker.init_worker_distributed_environment", "vllm.v1.worker.gpu_worker.logger" ], "n_typable": 88, "n_typed": 72, "n_any": 0, "n_untyped": 16, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 5, "n_methods": 40, "n_method_overloads": 40, "n_method_params": 36, "n_classes": 2, "n_attrs": 6, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/kv_connector_model_runner_mixin.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.v1.worker.kv_connector_model_runner_mixin.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.worker.kv_connector_model_runner_mixin.KVConnectorModelRunnerMixin", "methods": [ { "kind": "function", "name": "KVConnectorModelRunnerMixin.ensure_kv_transfer_shutdown", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KVConnectorModelRunnerMixin.kv_connector_no_forward", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "KVConnectorModelRunnerMixin.maybe_get_kv_connector_output", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "KVConnectorModelRunnerMixin._get_kv_connector_output", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "KVConnectorModelRunnerMixin.clear_kv_connector_metadata", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "KVConnectorModelRunnerMixin.use_uniform_kv_cache", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "KVConnectorModelRunnerMixin.allocate_uniform_kv_caches", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [], "n_typable": 21, "n_typed": 21, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 14, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.worker.kv_connector_model_runner_mixin", "names": [ "vllm.v1.worker.kv_connector_model_runner_mixin.KVConnectorModelRunnerMixin", "vllm.v1.worker.kv_connector_model_runner_mixin.logger" ], "n_typable": 22, "n_typed": 21, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 14, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/lora_model_runner_mixin.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.v1.worker.lora_model_runner_mixin.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.v1.worker.lora_model_runner_mixin.InputBatch", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.worker.lora_model_runner_mixin.LoRAModelRunnerMixin", "methods": [ { "kind": "function", "name": "LoRAModelRunnerMixin.load_lora_model", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "LoRAModelRunnerMixin._set_active_loras", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "LoRAModelRunnerMixin._ensure_lora_enabled", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "LoRAModelRunnerMixin.set_active_loras", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "LoRAModelRunnerMixin.maybe_setup_dummy_loras", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "LoRAModelRunnerMixin.maybe_select_dummy_loras", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "LoRAModelRunnerMixin.maybe_dummy_run_with_lora", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "LoRAModelRunnerMixin.maybe_remove_all_loras", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LoRAModelRunnerMixin.add_lora", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LoRAModelRunnerMixin.remove_lora", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LoRAModelRunnerMixin.pin_lora", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "LoRAModelRunnerMixin.list_loras", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [], "n_typable": 40, "n_typed": 36, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 28, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.worker.lora_model_runner_mixin", "names": [ "vllm.v1.worker.lora_model_runner_mixin.InputBatch", "vllm.v1.worker.lora_model_runner_mixin.LoRAModelRunnerMixin", "vllm.v1.worker.lora_model_runner_mixin.logger" ], "n_typable": 42, "n_typed": 37, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 28, "n_classes": 1, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/mamba_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.worker.mamba_utils.collect_mamba_copy_meta", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "vllm.v1.worker.mamba_utils.get_mamba_groups", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.v1.worker.mamba_utils.batch_memcpy_kernel", "n_typed": 1, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "class", "name": "vllm.v1.worker.mamba_utils.MambaCopyBuffers", "methods": [ { "kind": "function", "name": "MambaCopyBuffers.create", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "MambaCopyBuffers.src_ptrs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MambaCopyBuffers.dst_ptrs", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MambaCopyBuffers.sizes", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MambaCopyBuffers.offset", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 5, "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 4, "n_attrs": 4, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.worker.mamba_utils.batch_memcpy", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.v1.worker.mamba_utils.preprocess_mamba", "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "vllm.v1.worker.mamba_utils.do_mamba_copy_block", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.v1.worker.mamba_utils.postprocess_mamba", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 } ], "type_ignores": [], "name": "vllm.v1.worker.mamba_utils", "names": [ "vllm.v1.worker.mamba_utils.MambaCopyBuffers", "vllm.v1.worker.mamba_utils.batch_memcpy", "vllm.v1.worker.mamba_utils.batch_memcpy_kernel", "vllm.v1.worker.mamba_utils.collect_mamba_copy_meta", "vllm.v1.worker.mamba_utils.do_mamba_copy_block", "vllm.v1.worker.mamba_utils.get_mamba_groups", "vllm.v1.worker.mamba_utils.postprocess_mamba", "vllm.v1.worker.mamba_utils.preprocess_mamba" ], "n_typable": 47, "n_typed": 36, "n_any": 0, "n_untyped": 11, "n_functions": 7, "n_function_overloads": 7, "n_function_params": 35, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 4, "n_classes": 1, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/tpu_input_batch.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.worker.tpu_input_batch.InputBatch", "methods": [ { "kind": "function", "name": "InputBatch.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "InputBatch.add_request", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InputBatch.remove_request", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InputBatch.swap_states", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "InputBatch.condense", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "InputBatch._make_prompt_token_ids_tensor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "InputBatch.make_lora_inputs", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [ { "kind": "property", "name": "InputBatch.req_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "InputBatch.num_reqs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "InputBatch.all_greedy", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "InputBatch.all_random", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "InputBatch.no_top_p", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "InputBatch.no_top_k", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "InputBatch.no_min_p", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "InputBatch.no_penalties", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "InputBatch.max_num_logprobs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "InputBatch.no_allowed_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "InputBatch.max_num_reqs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.max_model_len", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.max_num_batched_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.pin_memory", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.vocab_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.req_id_to_index", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.token_ids_cpu_tensor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.token_ids_cpu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.num_tokens_no_spec", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.num_prompt_tokens", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.num_computed_tokens_cpu_tensor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.num_computed_tokens_cpu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.block_table", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.temperature", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.temperature_cpu_tensor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.temperature_cpu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.greedy_reqs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.random_reqs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.top_p", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.top_p_cpu_tensor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.top_p_cpu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.top_p_reqs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.top_k", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.top_k_cpu_tensor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.top_k_cpu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.top_k_reqs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.min_p", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.min_p_cpu_tensor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.min_p_cpu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.min_p_reqs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.frequency_penalties", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.frequency_penalties_cpu_tensor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.frequency_penalties_cpu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.frequency_penalties_reqs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.presence_penalties", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.presence_penalties_cpu_tensor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.presence_penalties_cpu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.presence_penalties_reqs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.repetition_penalties", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.repetition_penalties_cpu_tensor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.repetition_penalties_cpu", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.repetition_penalties_reqs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.min_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.request_lora_mapping", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.lora_id_to_request_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.lora_id_to_lora_request", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.generators", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.num_logprobs", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.in_progress_prompt_logprobs_cpu", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.logit_bias", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.has_allowed_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.allowed_token_ids_mask", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.allowed_token_ids_mask_cpu_tensor", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.bad_words_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "InputBatch.req_output_token_ids", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 89, "n_typed": 53, "n_any": 0, "n_untyped": 36, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 16, "n_attrs": 56, "n_properties": 10 } ], "type_ignores": [], "name": "vllm.v1.worker.tpu_input_batch", "names": [ "vllm.v1.worker.tpu_input_batch.InputBatch" ], "n_typable": 89, "n_typed": 53, "n_any": 0, "n_untyped": 36, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 16, "n_classes": 1, "n_attrs": 56, "n_properties": 10, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/ubatch_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.worker.ubatch_utils.maybe_create_ubatch_slices", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.v1.worker.ubatch_utils.split_attn_metadata", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.v1.worker.ubatch_utils.check_ubatch_thresholds", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.v1.worker.ubatch_utils.UBatchSlices", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.worker.ubatch_utils.UBatchSlice", "methods": [ { "kind": "function", "name": "UBatchSlice.is_empty", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "UBatchSlice.num_tokens", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "UBatchSlice.request_slice", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "UBatchSlice.token_slice", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_attrs": 2, "n_properties": 1 }, { "kind": "function", "name": "vllm.v1.worker.ubatch_utils.slice_query_start_locs", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.v1.worker.ubatch_utils.is_last_ubatch_empty", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [], "name": "vllm.v1.worker.ubatch_utils", "names": [ "vllm.v1.worker.ubatch_utils.UBatchSlice", "vllm.v1.worker.ubatch_utils.UBatchSlices", "vllm.v1.worker.ubatch_utils.check_ubatch_thresholds", "vllm.v1.worker.ubatch_utils.is_last_ubatch_empty", "vllm.v1.worker.ubatch_utils.maybe_create_ubatch_slices", "vllm.v1.worker.ubatch_utils.slice_query_start_locs", "vllm.v1.worker.ubatch_utils.split_attn_metadata" ], "n_typable": 24, "n_typed": 24, "n_any": 0, "n_untyped": 0, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 16, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 0, "n_classes": 1, "n_attrs": 3, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/ubatching.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.v1.worker.ubatching.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.v1.worker.ubatching.dbo_switch_to_comm_sync", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.worker.ubatching.UBatchContext", "methods": [ { "kind": "function", "name": "UBatchContext.__init__", "n_typed": 10, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "UBatchContext.__enter__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "UBatchContext.__exit__", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "UBatchContext._restore_context", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "UBatchContext.update_stream", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "UBatchContext._signal_comm_done", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "UBatchContext._signal_compute_done", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "UBatchContext._wait_compute_done", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "UBatchContext._wait_comm_done", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "UBatchContext._cpu_yield", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "UBatchContext.switch_to_comm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "UBatchContext.switch_to_compute", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "UBatchContext.switch_to_comm_sync", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "UBatchContext.switch_to_compute_sync", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "UBatchContext.maybe_run_recv_hook", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "UBatchContext.yield_", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "UBatchContext.yield_and_switch_from_compute_to_comm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "UBatchContext.yield_and_switch_from_comm_to_compute", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "UBatchContext.id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UBatchContext.comm_stream", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UBatchContext.compute_stream", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UBatchContext.forward_context", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UBatchContext.ready_barrier", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UBatchContext.cpu_wait_event", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UBatchContext.cpu_signal_event", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UBatchContext.current_stream", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UBatchContext.gpu_comm_done_event", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UBatchContext.gpu_compute_done_event", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UBatchContext.schedule", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "UBatchContext.recv_hook", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 44, "n_typed": 10, "n_any": 0, "n_untyped": 34, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 18, "n_method_overloads": 18, "n_method_params": 14, "n_attrs": 12, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.worker.ubatching.dbo_switch_to_compute_sync", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.v1.worker.ubatching.dbo_get_previous_event", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "attr", "name": "vllm.v1.worker.ubatching.dbo_switch_to_comm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.v1.worker.ubatching.dbo_yield_and_switch_from_compute_to_comm", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.v1.worker.ubatching.dbo_current_ubatch_id", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.v1.worker.ubatching.dbo_maybe_run_recv_hook", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.v1.worker.ubatching.dbo_switch_to_compute", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.v1.worker.ubatching.dbo_yield", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.v1.worker.ubatching.dbo_register_recv_hook", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.v1.worker.ubatching.make_ubatch_contexts", "n_typed": 7, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.v1.worker.ubatching.dbo_enabled", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.v1.worker.ubatching.dbo_yield_and_switch_from_comm_to_compute", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.v1.worker.ubatching", "names": [ "vllm.v1.worker.ubatching.UBatchContext", "vllm.v1.worker.ubatching.dbo_current_ubatch_id", "vllm.v1.worker.ubatching.dbo_enabled", "vllm.v1.worker.ubatching.dbo_get_previous_event", "vllm.v1.worker.ubatching.dbo_maybe_run_recv_hook", "vllm.v1.worker.ubatching.dbo_register_recv_hook", "vllm.v1.worker.ubatching.dbo_switch_to_comm", "vllm.v1.worker.ubatching.dbo_switch_to_comm_sync", "vllm.v1.worker.ubatching.dbo_switch_to_compute", "vllm.v1.worker.ubatching.dbo_switch_to_compute_sync", "vllm.v1.worker.ubatching.dbo_yield", "vllm.v1.worker.ubatching.dbo_yield_and_switch_from_comm_to_compute", "vllm.v1.worker.ubatching.dbo_yield_and_switch_from_compute_to_comm", "vllm.v1.worker.ubatching.logger", "vllm.v1.worker.ubatching.make_ubatch_contexts" ], "n_typable": 68, "n_typed": 19, "n_any": 0, "n_untyped": 49, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 10, "n_methods": 18, "n_method_overloads": 18, "n_method_params": 14, "n_classes": 1, "n_attrs": 21, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/utils.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.v1.worker.utils.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "function", "name": "vllm.v1.worker.utils.sanity_check_mm_encoder_outputs", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.v1.worker.utils.prepare_kernel_block_sizes", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.v1.worker.utils.is_residual_scattered_for_sp", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.v1.worker.utils.select_common_block_size", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.v1.worker.utils.AttentionGroup", "methods": [ { "kind": "function", "name": "AttentionGroup.create_metadata_builders", "n_typed": 2, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "AttentionGroup.get_metadata_builder", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "AttentionGroup.backend", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionGroup.layer_names", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionGroup.kv_cache_spec", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionGroup.kv_cache_group_id", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionGroup.metadata_builders", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 7, "n_typed": 4, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.v1.worker.utils.KVBlockZeroer", "methods": [ { "kind": "function", "name": "KVBlockZeroer.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "KVBlockZeroer.init_meta", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "KVBlockZeroer.zero_block_ids", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "KVBlockZeroer.device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "KVBlockZeroer.pin_memory", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 13, "n_typed": 10, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 8, "n_attrs": 2, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.worker.utils.bind_kv_cache", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.v1.worker.utils.request_memory", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.v1.worker.utils.add_kv_sharing_layers_to_kv_cache_groups", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [], "name": "vllm.v1.worker.utils", "names": [ "vllm.v1.worker.utils.AttentionGroup", "vllm.v1.worker.utils.KVBlockZeroer", "vllm.v1.worker.utils.add_kv_sharing_layers_to_kv_cache_groups", "vllm.v1.worker.utils.bind_kv_cache", "vllm.v1.worker.utils.is_residual_scattered_for_sp", "vllm.v1.worker.utils.logger", "vllm.v1.worker.utils.prepare_kernel_block_sizes", "vllm.v1.worker.utils.request_memory", "vllm.v1.worker.utils.sanity_check_mm_encoder_outputs", "vllm.v1.worker.utils.select_common_block_size" ], "n_typable": 45, "n_typed": 38, "n_any": 0, "n_untyped": 7, "n_functions": 7, "n_function_overloads": 7, "n_function_params": 17, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 13, "n_classes": 2, "n_attrs": 8, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/worker_base.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.worker.worker_base.WorkerWrapperBase", "methods": [ { "kind": "function", "name": "WorkerWrapperBase.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "WorkerWrapperBase.shutdown", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "WorkerWrapperBase.adjust_rank", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WorkerWrapperBase.update_environment_variables", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WorkerWrapperBase.init_worker", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WorkerWrapperBase.initialize_from_config", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WorkerWrapperBase.init_device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "WorkerWrapperBase.execute_method", "n_typed": 1, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "WorkerWrapperBase.__getattr__", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WorkerWrapperBase._apply_mm_cache", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WorkerWrapperBase.execute_model", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WorkerWrapperBase.reset_mm_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "WorkerWrapperBase.rpc_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WorkerWrapperBase.global_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WorkerWrapperBase.worker", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "WorkerWrapperBase.vllm_config", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 28, "n_typed": 21, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 12, "n_method_overloads": 12, "n_method_params": 12, "n_attrs": 4, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.worker.worker_base.ModelRunnerOutput", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "class", "name": "vllm.v1.worker.worker_base.WorkerBase", "methods": [ { "kind": "function", "name": "WorkerBase.__init__", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "WorkerBase.get_kv_cache_spec", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "WorkerBase.compile_or_warm_up_model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "WorkerBase.check_health", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "WorkerBase.init_device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "WorkerBase.initialize_cache", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "WorkerBase.reset_mm_cache", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "WorkerBase.get_model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "WorkerBase.apply_model", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WorkerBase.get_model_inspection", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "WorkerBase.load_model", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "WorkerBase.execute_model", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WorkerBase.sample_tokens", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WorkerBase.get_cache_block_size_bytes", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "WorkerBase.add_lora", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WorkerBase.remove_lora", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WorkerBase.pin_lora", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WorkerBase.list_loras", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "WorkerBase.shutdown", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [ { "kind": "property", "name": "WorkerBase.vocab_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "WorkerBase.vllm_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WorkerBase.model_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WorkerBase.cache_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WorkerBase.lora_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WorkerBase.load_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WorkerBase.parallel_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WorkerBase.scheduler_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WorkerBase.device_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WorkerBase.speculative_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WorkerBase.observability_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WorkerBase.kv_transfer_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WorkerBase.compilation_config", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WorkerBase.current_platform", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WorkerBase.local_rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WorkerBase.rank", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WorkerBase.distributed_init_method", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WorkerBase.is_driver_worker", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "WorkerBase.device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "WorkerBase.model_runner", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 52, "n_typed": 35, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 19, "n_method_overloads": 19, "n_method_params": 13, "n_attrs": 19, "n_properties": 1 }, { "kind": "attr", "name": "vllm.v1.worker.worker_base.AsyncModelRunnerOutput", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.v1.worker.worker_base.SchedulerOutput", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.v1.worker.worker_base.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.v1.worker.worker_base.GrammarOutput", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [], "name": "vllm.v1.worker.worker_base", "names": [ "vllm.v1.worker.worker_base.AsyncModelRunnerOutput", "vllm.v1.worker.worker_base.GrammarOutput", "vllm.v1.worker.worker_base.ModelRunnerOutput", "vllm.v1.worker.worker_base.SchedulerOutput", "vllm.v1.worker.worker_base.WorkerBase", "vllm.v1.worker.worker_base.WorkerWrapperBase", "vllm.v1.worker.worker_base.logger" ], "n_typable": 81, "n_typed": 56, "n_any": 0, "n_untyped": 25, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 31, "n_method_overloads": 31, "n_method_params": 25, "n_classes": 2, "n_attrs": 28, "n_properties": 1, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/workspace.py", "symbol_reports": [ { "kind": "function", "name": "vllm.v1.worker.workspace.is_workspace_manager_initialized", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.v1.worker.workspace.init_workspace_manager", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.v1.worker.workspace.WorkspaceManager", "methods": [ { "kind": "function", "name": "WorkspaceManager.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "WorkspaceManager._workspace_size_bytes", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WorkspaceManager.lock", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "WorkspaceManager.unlock", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "WorkspaceManager.is_locked", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "WorkspaceManager.get_simultaneous", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "WorkspaceManager._ensure_workspace_size", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 12, "n_typed": 11, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.v1.worker.workspace.unlock_workspace", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.v1.worker.workspace.lock_workspace", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.v1.worker.workspace.reset_workspace_manager", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "vllm.v1.worker.workspace.current_workspace_manager", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.v1.worker.workspace.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.v1.worker.workspace", "names": [ "vllm.v1.worker.workspace.WorkspaceManager", "vllm.v1.worker.workspace.current_workspace_manager", "vllm.v1.worker.workspace.init_workspace_manager", "vllm.v1.worker.workspace.is_workspace_manager_initialized", "vllm.v1.worker.workspace.lock_workspace", "vllm.v1.worker.workspace.logger", "vllm.v1.worker.workspace.reset_workspace_manager", "vllm.v1.worker.workspace.unlock_workspace" ], "n_typable": 21, "n_typed": 19, "n_any": 0, "n_untyped": 2, "n_functions": 6, "n_function_overloads": 6, "n_function_params": 2, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 5, "n_classes": 1, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/xpu_model_runner.py", "symbol_reports": [ { "kind": "class", "name": "vllm.v1.worker.xpu_model_runner.XPUModelRunner", "methods": [ { "kind": "function", "name": "XPUModelRunner.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "XPUModelRunner._sync_device", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "XPUModelRunner.cascade_attn_enabled", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 5, "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_attrs": 1, "n_properties": 0 }, { "kind": "attr", "name": "vllm.v1.worker.xpu_model_runner.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.v1.worker.xpu_model_runner", "names": [ "vllm.v1.worker.xpu_model_runner.XPUModelRunner", "vllm.v1.worker.xpu_model_runner.logger" ], "n_typable": 6, "n_typed": 3, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 2, "n_classes": 1, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/v1/worker/xpu_worker.py", "symbol_reports": [ { "kind": "attr", "name": "vllm.v1.worker.xpu_worker.logger", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "class", "name": "vllm.v1.worker.xpu_worker.XPUWorker", "methods": [ { "kind": "function", "name": "XPUWorker.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "XPUWorker.init_device", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "XPUWorker.profiler", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 8, "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.v1.worker.xpu_worker", "names": [ "vllm.v1.worker.xpu_worker.XPUWorker", "vllm.v1.worker.xpu_worker.logger" ], "n_typable": 9, "n_typed": 6, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_classes": 1, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/vllm_flash_attn/flash_attn_interface.py", "symbol_reports": [ { "kind": "function", "name": "vllm.vllm_flash_attn.flash_attn_interface.is_fa_version_supported", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.vllm_flash_attn.flash_attn_interface.flash_attn_varlen_func", "n_typed": 3, "n_any": 0, "n_untyped": 28, "n_overloads": 1, "n_typable": 31, "n_params": 30, "n_function_overloads": 1, "n_function_params": 30 }, { "kind": "function", "name": "vllm.vllm_flash_attn.flash_attn_interface.get_scheduler_metadata", "n_typed": 5, "n_any": 0, "n_untyped": 16, "n_overloads": 1, "n_typable": 21, "n_params": 20, "n_function_overloads": 1, "n_function_params": 20 }, { "kind": "function", "name": "vllm.vllm_flash_attn.flash_attn_interface.fa_version_unsupported_reason", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.vllm_flash_attn.flash_attn_interface.sparse_attn_varlen_func", "n_typed": 0, "n_any": 0, "n_untyped": 21, "n_overloads": 1, "n_typable": 21, "n_params": 20, "n_function_overloads": 1, "n_function_params": 20 }, { "kind": "attr", "name": "vllm.vllm_flash_attn.flash_attn_interface.FA4_AVAILABLE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.vllm_flash_attn.flash_attn_interface.DEFAULT_FA_VERSION", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.vllm_flash_attn.flash_attn_interface.sparse_attn_func", "n_typed": 0, "n_any": 0, "n_untyped": 17, "n_overloads": 1, "n_typable": 17, "n_params": 16, "n_function_overloads": 1, "n_function_params": 16 }, { "kind": "attr", "name": "vllm.vllm_flash_attn.flash_attn_interface.FA3_AVAILABLE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.vllm_flash_attn.flash_attn_interface.maybe_contiguous", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.vllm_flash_attn.flash_attn_interface.FA2_UNAVAILABLE_REASON", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.vllm_flash_attn.flash_attn_interface.FA2_AVAILABLE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.vllm_flash_attn.flash_attn_interface.FA3_UNAVAILABLE_REASON", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.vllm_flash_attn.flash_attn_interface.FA4_UNAVAILABLE_REASON", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "type_ignores": [ { "kind": "type", "rules": [ "attr-defined" ] }, { "kind": "type", "rules": [ "attr-defined" ] } ], "name": "vllm.vllm_flash_attn.flash_attn_interface", "names": [ "vllm.vllm_flash_attn.flash_attn_interface.DEFAULT_FA_VERSION", "vllm.vllm_flash_attn.flash_attn_interface.FA2_AVAILABLE", "vllm.vllm_flash_attn.flash_attn_interface.FA2_UNAVAILABLE_REASON", "vllm.vllm_flash_attn.flash_attn_interface.FA3_AVAILABLE", "vllm.vllm_flash_attn.flash_attn_interface.FA3_UNAVAILABLE_REASON", "vllm.vllm_flash_attn.flash_attn_interface.FA4_AVAILABLE", "vllm.vllm_flash_attn.flash_attn_interface.FA4_UNAVAILABLE_REASON", "vllm.vllm_flash_attn.flash_attn_interface.fa_version_unsupported_reason", "vllm.vllm_flash_attn.flash_attn_interface.flash_attn_varlen_func", "vllm.vllm_flash_attn.flash_attn_interface.get_scheduler_metadata", "vllm.vllm_flash_attn.flash_attn_interface.is_fa_version_supported", "vllm.vllm_flash_attn.flash_attn_interface.maybe_contiguous", "vllm.vllm_flash_attn.flash_attn_interface.sparse_attn_func", "vllm.vllm_flash_attn.flash_attn_interface.sparse_attn_varlen_func" ], "n_typable": 96, "n_typed": 12, "n_any": 0, "n_untyped": 84, "n_functions": 7, "n_function_overloads": 7, "n_function_params": 89, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 7, "n_properties": 0, "n_type_ignores": 2 }, { "path": "vllm/vllm_flash_attn/cute/interface.py", "symbol_reports": [ { "kind": "function", "name": "vllm.vllm_flash_attn.cute.interface.flash_attn_func", "n_typed": 17, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 18, "n_params": 17, "n_function_overloads": 1, "n_function_params": 17 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.interface.flash_attn_varlen_func", "n_typed": 20, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 21, "n_params": 20, "n_function_overloads": 1, "n_function_params": 20 }, { "kind": "class", "name": "vllm.vllm_flash_attn.cute.interface.FlashAttnFunc", "methods": [ { "kind": "function", "name": "FlashAttnFunc.forward", "n_typed": 17, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 19, "n_params": 18, "n_function_overloads": 1, "n_function_params": 18 }, { "kind": "function", "name": "FlashAttnFunc.backward", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 23, "n_typed": 17, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 21, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.interface.num_splits_heuristic", "n_typed": 0, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.interface.maybe_contiguous", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.vllm_flash_attn.cute.interface.FlashAttnVarlenFunc", "methods": [ { "kind": "function", "name": "FlashAttnVarlenFunc.forward", "n_typed": 20, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 22, "n_params": 21, "n_function_overloads": 1, "n_function_params": 21 }, { "kind": "function", "name": "FlashAttnVarlenFunc.backward", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [], "n_typable": 26, "n_typed": 20, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 24, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.vllm_flash_attn.cute.interface.torch2cute_dtype_map", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.interface.flash_attn_combine", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "type_ignores": [], "name": "vllm.vllm_flash_attn.cute.interface", "names": [ "vllm.vllm_flash_attn.cute.interface.FlashAttnFunc", "vllm.vllm_flash_attn.cute.interface.FlashAttnVarlenFunc", "vllm.vllm_flash_attn.cute.interface.flash_attn_combine", "vllm.vllm_flash_attn.cute.interface.flash_attn_func", "vllm.vllm_flash_attn.cute.interface.flash_attn_varlen_func", "vllm.vllm_flash_attn.cute.interface.maybe_contiguous", "vllm.vllm_flash_attn.cute.interface.num_splits_heuristic", "vllm.vllm_flash_attn.cute.interface.torch2cute_dtype_map" ], "n_typable": 103, "n_typed": 82, "n_any": 0, "n_untyped": 21, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 49, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 45, "n_classes": 2, "n_attrs": 1, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/vllm_flash_attn/cute/ampere_helpers.py", "symbol_reports": [ { "kind": "function", "name": "vllm.vllm_flash_attn.cute.ampere_helpers.get_smem_layout_atom", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.ampere_helpers.gemm_rs", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.ampere_helpers.gemm", "n_typed": 13, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 } ], "type_ignores": [], "name": "vllm.vllm_flash_attn.cute.ampere_helpers", "names": [ "vllm.vllm_flash_attn.cute.ampere_helpers.gemm", "vllm.vllm_flash_attn.cute.ampere_helpers.gemm_rs", "vllm.vllm_flash_attn.cute.ampere_helpers.get_smem_layout_atom" ], "n_typable": 24, "n_typed": 24, "n_any": 0, "n_untyped": 0, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 21, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/vllm_flash_attn/cute/barrier.py", "symbol_reports": [ { "kind": "function", "name": "vllm.vllm_flash_attn.cute.barrier.red_release", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.barrier.arrive_inc", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.barrier.red_relaxed", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.barrier.ld_acquire", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.barrier.wait_eq", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "type_ignores": [], "name": "vllm.vllm_flash_attn.cute.barrier", "names": [ "vllm.vllm_flash_attn.cute.barrier.arrive_inc", "vllm.vllm_flash_attn.cute.barrier.ld_acquire", "vllm.vllm_flash_attn.cute.barrier.red_relaxed", "vllm.vllm_flash_attn.cute.barrier.red_release", "vllm.vllm_flash_attn.cute.barrier.wait_eq" ], "n_typable": 24, "n_typed": 18, "n_any": 0, "n_untyped": 6, "n_functions": 5, "n_function_overloads": 5, "n_function_params": 19, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/vllm_flash_attn/cute/benchmark.py", "symbol_reports": [ { "kind": "function", "name": "vllm.vllm_flash_attn.cute.benchmark.benchmark_fwd_bwd", "n_typed": 0, "n_any": 0, "n_untyped": 10, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.benchmark.benchmark_backward", "n_typed": 0, "n_any": 0, "n_untyped": 10, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.benchmark.benchmark_memory", "n_typed": 0, "n_any": 0, "n_untyped": 6, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.benchmark.pytorch_profiler", "n_typed": 0, "n_any": 0, "n_untyped": 10, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.benchmark.benchmark_combined", "n_typed": 0, "n_any": 0, "n_untyped": 10, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.benchmark.benchmark_all", "n_typed": 0, "n_any": 0, "n_untyped": 10, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.benchmark.benchmark_forward", "n_typed": 0, "n_any": 0, "n_untyped": 9, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 } ], "type_ignores": [], "name": "vllm.vllm_flash_attn.cute.benchmark", "names": [ "vllm.vllm_flash_attn.cute.benchmark.benchmark_all", "vllm.vllm_flash_attn.cute.benchmark.benchmark_backward", "vllm.vllm_flash_attn.cute.benchmark.benchmark_combined", "vllm.vllm_flash_attn.cute.benchmark.benchmark_forward", "vllm.vllm_flash_attn.cute.benchmark.benchmark_fwd_bwd", "vllm.vllm_flash_attn.cute.benchmark.benchmark_memory", "vllm.vllm_flash_attn.cute.benchmark.pytorch_profiler" ], "n_typable": 65, "n_typed": 0, "n_any": 0, "n_untyped": 65, "n_functions": 7, "n_function_overloads": 7, "n_function_params": 58, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/vllm_flash_attn/cute/blackwell_helpers.py", "symbol_reports": [ { "kind": "function", "name": "vllm.vllm_flash_attn.cute.blackwell_helpers.gemm", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.blackwell_helpers.gemm_w_idx", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.blackwell_helpers.gemm_ptx", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.blackwell_helpers.gemm_ptx_loop", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.blackwell_helpers.gemm_ptx_w_idx", "n_typed": 10, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.blackwell_helpers.gemm_ptx_partial1", "n_typed": 16, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.blackwell_helpers.gemm_ptx_partial", "n_typed": 11, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.blackwell_helpers.i64_to_i32x2", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.vllm_flash_attn.cute.blackwell_helpers", "names": [ "vllm.vllm_flash_attn.cute.blackwell_helpers.gemm", "vllm.vllm_flash_attn.cute.blackwell_helpers.gemm_ptx", "vllm.vllm_flash_attn.cute.blackwell_helpers.gemm_ptx_loop", "vllm.vllm_flash_attn.cute.blackwell_helpers.gemm_ptx_partial", "vllm.vllm_flash_attn.cute.blackwell_helpers.gemm_ptx_partial1", "vllm.vllm_flash_attn.cute.blackwell_helpers.gemm_ptx_w_idx", "vllm.vllm_flash_attn.cute.blackwell_helpers.gemm_w_idx", "vllm.vllm_flash_attn.cute.blackwell_helpers.i64_to_i32x2" ], "n_typable": 71, "n_typed": 70, "n_any": 0, "n_untyped": 1, "n_functions": 8, "n_function_overloads": 8, "n_function_params": 63, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/vllm_flash_attn/cute/block_info.py", "symbol_reports": [ { "kind": "class", "name": "vllm.vllm_flash_attn.cute.block_info.BlockInfo", "methods": [ { "kind": "function", "name": "BlockInfo.get_n_block_min_max", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BlockInfo.get_m_block_min_max", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "BlockInfo.get_n_block_min_causal_local_mask", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "BlockInfo.get_n_block_min_before_local_mask", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BlockInfo.tile_m", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BlockInfo.tile_n", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BlockInfo.is_causal", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BlockInfo.is_local", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BlockInfo.is_split_kv", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BlockInfo.window_size_left", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BlockInfo.window_size_right", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BlockInfo.qhead_per_kvhead_packgqa", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 16, "n_typed": 16, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 12, "n_attrs": 8, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.vllm_flash_attn.cute.block_info", "names": [ "vllm.vllm_flash_attn.cute.block_info.BlockInfo" ], "n_typable": 16, "n_typed": 16, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 12, "n_classes": 1, "n_attrs": 8, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/vllm_flash_attn/cute/block_sparse_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.vllm_flash_attn.cute.block_sparse_utils.handle_block_sparse_empty_tile_correction_sm100", "n_typed": 28, "n_any": 0, "n_untyped": 6, "n_overloads": 1, "n_typable": 34, "n_params": 33, "n_function_overloads": 1, "n_function_params": 33 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.block_sparse_utils.dQaccum_store_block_sparse_bwd_sm90", "n_typed": 7, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.block_sparse_utils.produce_block_sparse_loads_sm100", "n_typed": 5, "n_any": 0, "n_untyped": 9, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.block_sparse_utils.consume_block_sparse_loads", "n_typed": 6, "n_any": 0, "n_untyped": 15, "n_overloads": 1, "n_typable": 21, "n_params": 20, "n_function_overloads": 1, "n_function_params": 20 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.block_sparse_utils.produce_block_sparse_q_loads_bwd_sm100", "n_typed": 5, "n_any": 0, "n_untyped": 21, "n_overloads": 1, "n_typable": 26, "n_params": 25, "n_function_overloads": 1, "n_function_params": 25 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.block_sparse_utils.consume_block_sparse_mma_bwd_sm90", "n_typed": 5, "n_any": 0, "n_untyped": 14, "n_overloads": 1, "n_typable": 19, "n_params": 18, "n_function_overloads": 1, "n_function_params": 18 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.block_sparse_utils.get_total_q_block_count_bwd", "n_typed": 3, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.block_sparse_utils.sparse_tensor_m_block", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.block_sparse_utils.load_block_list_sm100", "n_typed": 3, "n_any": 0, "n_untyped": 8, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.block_sparse_utils.produce_block_sparse_loads", "n_typed": 6, "n_any": 0, "n_untyped": 10, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.block_sparse_utils.load_block_list", "n_typed": 6, "n_any": 0, "n_untyped": 8, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.block_sparse_utils.get_total_block_count", "n_typed": 3, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.block_sparse_utils.softmax_block_sparse_sm100", "n_typed": 16, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 21, "n_params": 20, "n_function_overloads": 1, "n_function_params": 20 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.block_sparse_utils.get_block_sparse_iteration_info_bwd", "n_typed": 3, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.block_sparse_utils.get_m_block_from_iter_bwd", "n_typed": 4, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.block_sparse_utils.finish_overlap_v_load", "n_typed": 1, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.block_sparse_utils.produce_block_sparse_q_loads_bwd_sm90", "n_typed": 4, "n_any": 0, "n_untyped": 16, "n_overloads": 1, "n_typable": 20, "n_params": 19, "n_function_overloads": 1, "n_function_params": 19 } ], "type_ignores": [], "name": "vllm.vllm_flash_attn.cute.block_sparse_utils", "names": [ "vllm.vllm_flash_attn.cute.block_sparse_utils.consume_block_sparse_loads", "vllm.vllm_flash_attn.cute.block_sparse_utils.consume_block_sparse_mma_bwd_sm90", "vllm.vllm_flash_attn.cute.block_sparse_utils.dQaccum_store_block_sparse_bwd_sm90", "vllm.vllm_flash_attn.cute.block_sparse_utils.finish_overlap_v_load", "vllm.vllm_flash_attn.cute.block_sparse_utils.get_block_sparse_iteration_info_bwd", "vllm.vllm_flash_attn.cute.block_sparse_utils.get_m_block_from_iter_bwd", "vllm.vllm_flash_attn.cute.block_sparse_utils.get_total_block_count", "vllm.vllm_flash_attn.cute.block_sparse_utils.get_total_q_block_count_bwd", "vllm.vllm_flash_attn.cute.block_sparse_utils.handle_block_sparse_empty_tile_correction_sm100", "vllm.vllm_flash_attn.cute.block_sparse_utils.load_block_list", "vllm.vllm_flash_attn.cute.block_sparse_utils.load_block_list_sm100", "vllm.vllm_flash_attn.cute.block_sparse_utils.produce_block_sparse_loads", "vllm.vllm_flash_attn.cute.block_sparse_utils.produce_block_sparse_loads_sm100", "vllm.vllm_flash_attn.cute.block_sparse_utils.produce_block_sparse_q_loads_bwd_sm100", "vllm.vllm_flash_attn.cute.block_sparse_utils.produce_block_sparse_q_loads_bwd_sm90", "vllm.vllm_flash_attn.cute.block_sparse_utils.softmax_block_sparse_sm100", "vllm.vllm_flash_attn.cute.block_sparse_utils.sparse_tensor_m_block" ], "n_typable": 247, "n_typed": 107, "n_any": 0, "n_untyped": 140, "n_functions": 17, "n_function_overloads": 17, "n_function_params": 230, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/vllm_flash_attn/cute/block_sparsity.py", "symbol_reports": [ { "kind": "class", "name": "vllm.vllm_flash_attn.cute.block_sparsity.BlockSparseTensors", "methods": [ { "kind": "function", "name": "BlockSparseTensors.__new_from_mlir_values__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BlockSparseTensors.mask_block_cnt", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BlockSparseTensors.mask_block_idx", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BlockSparseTensors.full_block_cnt", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BlockSparseTensors.full_block_idx", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 2, "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 4, "n_properties": 0 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.block_sparsity.normalize_block_sparse_tensors", "n_typed": 6, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.block_sparsity.get_block_sparse_expected_shapes_bwd", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.block_sparsity.fast_sampling", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.block_sparsity.get_block_sparse_broadcast_pattern", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.block_sparsity.normalize_block_sparse_config", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.block_sparsity.to_cute_block_sparse_tensors", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.block_sparsity.infer_block_sparse_expected_shapes", "n_typed": 12, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "class", "name": "vllm.vllm_flash_attn.cute.block_sparsity.BlockSparseTensorsTorch", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "BlockSparseTensorsTorch.mask_block_cnt", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BlockSparseTensorsTorch.mask_block_idx", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BlockSparseTensorsTorch.full_block_cnt", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BlockSparseTensorsTorch.full_block_idx", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "BlockSparseTensorsTorch.block_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 5, "n_properties": 0 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.block_sparsity.get_block_sparse_expected_shapes", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.block_sparsity.ceildiv", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.block_sparsity.is_block_sparsity_enabled", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.block_sparsity.normalize_block_sparse_config_bwd", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "type_ignores": [], "name": "vllm.vllm_flash_attn.cute.block_sparsity", "names": [ "vllm.vllm_flash_attn.cute.block_sparsity.BlockSparseTensors", "vllm.vllm_flash_attn.cute.block_sparsity.BlockSparseTensorsTorch", "vllm.vllm_flash_attn.cute.block_sparsity.ceildiv", "vllm.vllm_flash_attn.cute.block_sparsity.fast_sampling", "vllm.vllm_flash_attn.cute.block_sparsity.get_block_sparse_broadcast_pattern", "vllm.vllm_flash_attn.cute.block_sparsity.get_block_sparse_expected_shapes", "vllm.vllm_flash_attn.cute.block_sparsity.get_block_sparse_expected_shapes_bwd", "vllm.vllm_flash_attn.cute.block_sparsity.infer_block_sparse_expected_shapes", "vllm.vllm_flash_attn.cute.block_sparsity.is_block_sparsity_enabled", "vllm.vllm_flash_attn.cute.block_sparsity.normalize_block_sparse_config", "vllm.vllm_flash_attn.cute.block_sparsity.normalize_block_sparse_config_bwd", "vllm.vllm_flash_attn.cute.block_sparsity.normalize_block_sparse_tensors", "vllm.vllm_flash_attn.cute.block_sparsity.to_cute_block_sparse_tensors" ], "n_typable": 64, "n_typed": 60, "n_any": 0, "n_untyped": 4, "n_functions": 11, "n_function_overloads": 11, "n_function_params": 51, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_classes": 2, "n_attrs": 9, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/vllm_flash_attn/cute/compute_block_sparsity.py", "symbol_reports": [ { "kind": "class", "name": "vllm.vllm_flash_attn.cute.compute_block_sparsity.BlockSparsityKernel", "methods": [ { "kind": "function", "name": "BlockSparsityKernel.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "BlockSparsityKernel.__call__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "BlockSparsityKernel.kernel", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "BlockSparsityKernel.mask_mod", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockSparsityKernel.tile_mn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockSparsityKernel.compute_full_blocks", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockSparsityKernel.use_aux_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "BlockSparsityKernel.use_fast_sampling", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 25, "n_typed": 17, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 17, "n_attrs": 5, "n_properties": 0 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.compute_block_sparsity.compute_block_sparsity", "n_typed": 5, "n_any": 0, "n_untyped": 7, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 } ], "type_ignores": [], "name": "vllm.vllm_flash_attn.cute.compute_block_sparsity", "names": [ "vllm.vllm_flash_attn.cute.compute_block_sparsity.BlockSparsityKernel", "vllm.vllm_flash_attn.cute.compute_block_sparsity.compute_block_sparsity" ], "n_typable": 37, "n_typed": 22, "n_any": 0, "n_untyped": 15, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 11, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 17, "n_classes": 1, "n_attrs": 5, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/vllm_flash_attn/cute/copy_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.vllm_flash_attn.cute.copy_utils.cpasync_bulk_g2s", "n_typed": 4, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.copy_utils.set_block_rank", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.copy_utils.tiled_copy_2d", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.copy_utils.cpasync_reduce_bulk_add_f32", "n_typed": 3, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.copy_utils.cpasync_bulk_get_copy_fn", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.copy_utils.atomic_add_fp32x4", "n_typed": 6, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.copy_utils.tma_get_copy_fn", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.copy_utils.tma_producer_copy_fn", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.copy_utils.cvt_copy", "n_typed": 5, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.copy_utils.store_shared_remote_fp32x4", "n_typed": 8, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.copy_utils.get_copy_atom", "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.copy_utils.tiled_copy_1d", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.copy_utils.copy", "n_typed": 6, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.copy_utils.make_tmem_copy", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.copy_utils.load_s2r", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [], "name": "vllm.vllm_flash_attn.cute.copy_utils", "names": [ "vllm.vllm_flash_attn.cute.copy_utils.atomic_add_fp32x4", "vllm.vllm_flash_attn.cute.copy_utils.copy", "vllm.vllm_flash_attn.cute.copy_utils.cpasync_bulk_g2s", "vllm.vllm_flash_attn.cute.copy_utils.cpasync_bulk_get_copy_fn", "vllm.vllm_flash_attn.cute.copy_utils.cpasync_reduce_bulk_add_f32", "vllm.vllm_flash_attn.cute.copy_utils.cvt_copy", "vllm.vllm_flash_attn.cute.copy_utils.get_copy_atom", "vllm.vllm_flash_attn.cute.copy_utils.load_s2r", "vllm.vllm_flash_attn.cute.copy_utils.make_tmem_copy", "vllm.vllm_flash_attn.cute.copy_utils.set_block_rank", "vllm.vllm_flash_attn.cute.copy_utils.store_shared_remote_fp32x4", "vllm.vllm_flash_attn.cute.copy_utils.tiled_copy_1d", "vllm.vllm_flash_attn.cute.copy_utils.tiled_copy_2d", "vllm.vllm_flash_attn.cute.copy_utils.tma_get_copy_fn", "vllm.vllm_flash_attn.cute.copy_utils.tma_producer_copy_fn" ], "n_typable": 95, "n_typed": 68, "n_any": 0, "n_untyped": 27, "n_functions": 15, "n_function_overloads": 15, "n_function_params": 80, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/vllm_flash_attn/cute/cute_dsl_ptxas.py", "symbol_reports": [ { "kind": "function", "name": "vllm.vllm_flash_attn.cute.cute_dsl_ptxas.patch", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "attr", "name": "vllm.vllm_flash_attn.cute.cute_dsl_ptxas.CUTE_DSL_PTXAS_PATH", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "vllm.vllm_flash_attn.cute.cute_dsl_ptxas.VERBOSE", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.vllm_flash_attn.cute.cute_dsl_ptxas", "names": [ "vllm.vllm_flash_attn.cute.cute_dsl_ptxas.CUTE_DSL_PTXAS_PATH", "vllm.vllm_flash_attn.cute.cute_dsl_ptxas.VERBOSE", "vllm.vllm_flash_attn.cute.cute_dsl_ptxas.patch" ], "n_typable": 3, "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 2, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/vllm_flash_attn/cute/cute_dsl_utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.vllm_flash_attn.cute.cute_dsl_utils.load_cubin_module_data_patched", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.cute_dsl_utils.cute_compile_patched", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.cute_dsl_utils.assume_tensor_aligned", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.vllm_flash_attn.cute.cute_dsl_utils.ParamsBase", "methods": [ { "kind": "function", "name": "ParamsBase.__extract_mlir_values__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ParamsBase.__new_from_mlir_values__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.cute_dsl_utils.get_max_active_clusters", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.cute_dsl_utils.get_device_capacity", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.cute_dsl_utils.get_broadcast_dims", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.vllm_flash_attn.cute.cute_dsl_utils.ArgumentsBase", "methods": [ { "kind": "function", "name": "ArgumentsBase.__c_pointers__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ArgumentsBase.__get_mlir_types__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ArgumentsBase.__new_from_mlir_values__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 4, "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "attr", "name": "vllm.vllm_flash_attn.cute.cute_dsl_utils.torch2cute_dtype_map", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "vllm.vllm_flash_attn.cute.cute_dsl_utils.extract", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.cute_dsl_utils.to_cute_tensor", "n_typed": 0, "n_any": 0, "n_untyped": 6, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.cute_dsl_utils.assume_strides_aligned", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "attr", "name": "vllm.vllm_flash_attn.cute.cute_dsl_utils.StaticTypes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "type_ignores": [], "name": "vllm.vllm_flash_attn.cute.cute_dsl_utils", "names": [ "vllm.vllm_flash_attn.cute.cute_dsl_utils.ArgumentsBase", "vllm.vllm_flash_attn.cute.cute_dsl_utils.ParamsBase", "vllm.vllm_flash_attn.cute.cute_dsl_utils.StaticTypes", "vllm.vllm_flash_attn.cute.cute_dsl_utils.assume_strides_aligned", "vllm.vllm_flash_attn.cute.cute_dsl_utils.assume_tensor_aligned", "vllm.vllm_flash_attn.cute.cute_dsl_utils.cute_compile_patched", "vllm.vllm_flash_attn.cute.cute_dsl_utils.extract", "vllm.vllm_flash_attn.cute.cute_dsl_utils.get_broadcast_dims", "vllm.vllm_flash_attn.cute.cute_dsl_utils.get_device_capacity", "vllm.vllm_flash_attn.cute.cute_dsl_utils.get_max_active_clusters", "vllm.vllm_flash_attn.cute.cute_dsl_utils.load_cubin_module_data_patched", "vllm.vllm_flash_attn.cute.cute_dsl_utils.to_cute_tensor", "vllm.vllm_flash_attn.cute.cute_dsl_utils.torch2cute_dtype_map" ], "n_typable": 30, "n_typed": 4, "n_any": 0, "n_untyped": 26, "n_functions": 8, "n_function_overloads": 8, "n_function_params": 14, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 2, "n_classes": 2, "n_attrs": 3, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/vllm_flash_attn/cute/fast_math.py", "symbol_reports": [ { "kind": "function", "name": "vllm.vllm_flash_attn.cute.fast_math.clz", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "type_ignores": [], "name": "vllm.vllm_flash_attn.cute.fast_math", "names": [ "vllm.vllm_flash_attn.cute.fast_math.clz" ], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 1, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/vllm_flash_attn/cute/flash_bwd.py", "symbol_reports": [ { "kind": "class", "name": "vllm.vllm_flash_attn.cute.flash_bwd.FlashAttentionBackwardSm80", "methods": [ { "kind": "function", "name": "FlashAttentionBackwardSm80.__init__", "n_typed": 18, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 19, "n_params": 18, "n_function_overloads": 1, "n_function_params": 18 }, { "kind": "function", "name": "FlashAttentionBackwardSm80.can_implement", "n_typed": 1, "n_any": 0, "n_untyped": 10, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "FlashAttentionBackwardSm80._check_type", "n_typed": 13, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 }, { "kind": "function", "name": "FlashAttentionBackwardSm80._setup_attributes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashAttentionBackwardSm80._get_tiled_mma", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashAttentionBackwardSm80._get_shared_storage_cls", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashAttentionBackwardSm80.__call__", "n_typed": 19, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 20, "n_params": 19, "n_function_overloads": 1, "n_function_params": 19 }, { "kind": "function", "name": "FlashAttentionBackwardSm80.kernel", "n_typed": 34, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 35, "n_params": 34, "n_function_overloads": 1, "n_function_params": 34 }, { "kind": "function", "name": "FlashAttentionBackwardSm80.compute_one_m_block", "n_typed": 13, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 }, { "kind": "function", "name": "FlashAttentionBackwardSm80.epilogue", "n_typed": 16, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 17, "n_params": 16, "n_function_overloads": 1, "n_function_params": 16 }, { "kind": "function", "name": "FlashAttentionBackwardSm80.advance_pipeline", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "FlashAttentionBackwardSm80.load_K", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "FlashAttentionBackwardSm80.load_V", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "FlashAttentionBackwardSm80.load_Q_LSE", "n_typed": 13, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 }, { "kind": "function", "name": "FlashAttentionBackwardSm80.load_dO_dPsum", "n_typed": 13, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashAttentionBackwardSm80.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm80.head_dim_padded", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm80.same_hdim_kv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm80.head_dim_v_padded", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm80.check_hdim_oob", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm80.check_hdim_v_oob", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm80.qhead_per_kvhead", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm80.m_block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm80.n_block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm80.num_threads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm80.pack_gqa", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm80.is_causal", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm80.num_stages_Q", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm80.num_stages_dO", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm80.SdP_swapAB", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm80.dKV_swapAB", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm80.dQ_swapAB", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm80.AtomLayoutMSdP", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm80.AtomLayoutNdKV", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm80.AtomLayoutMdQ", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm80.Mma_dKV_is_RS", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm80.V_in_regs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm80.share_QV_smem", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 201, "n_typed": 153, "n_any": 0, "n_untyped": 48, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 163, "n_attrs": 23, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.vllm_flash_attn.cute.flash_bwd", "names": [ "vllm.vllm_flash_attn.cute.flash_bwd.FlashAttentionBackwardSm80" ], "n_typable": 201, "n_typed": 153, "n_any": 0, "n_untyped": 48, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 163, "n_classes": 1, "n_attrs": 23, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/vllm_flash_attn/cute/flash_bwd_postprocess.py", "symbol_reports": [ { "kind": "class", "name": "vllm.vllm_flash_attn.cute.flash_bwd_postprocess.FlashAttentionBackwardPostprocess", "methods": [ { "kind": "function", "name": "FlashAttentionBackwardPostprocess.__init__", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "FlashAttentionBackwardPostprocess.can_implement", "n_typed": 1, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FlashAttentionBackwardPostprocess._get_tiled_mma", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashAttentionBackwardPostprocess._setup_attributes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashAttentionBackwardPostprocess.__call__", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "FlashAttentionBackwardPostprocess.kernel", "n_typed": 14, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 15, "n_params": 14, "n_function_overloads": 1, "n_function_params": 14 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashAttentionBackwardPostprocess.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardPostprocess.tile_m", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardPostprocess.arch", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardPostprocess.tile_hdim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardPostprocess.check_hdim_oob", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardPostprocess.num_threads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardPostprocess.AtomLayoutMdQ", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardPostprocess.dQ_swapAB", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 45, "n_typed": 28, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 31, "n_attrs": 8, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.vllm_flash_attn.cute.flash_bwd_postprocess", "names": [ "vllm.vllm_flash_attn.cute.flash_bwd_postprocess.FlashAttentionBackwardPostprocess" ], "n_typable": 45, "n_typed": 28, "n_any": 0, "n_untyped": 17, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 31, "n_classes": 1, "n_attrs": 8, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/vllm_flash_attn/cute/flash_bwd_preprocess.py", "symbol_reports": [ { "kind": "class", "name": "vllm.vllm_flash_attn.cute.flash_bwd_preprocess.FlashAttentionBackwardPreprocess", "methods": [ { "kind": "function", "name": "FlashAttentionBackwardPreprocess.__init__", "n_typed": 5, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "FlashAttentionBackwardPreprocess.can_implement", "n_typed": 1, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FlashAttentionBackwardPreprocess._setup_attributes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashAttentionBackwardPreprocess.__call__", "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "FlashAttentionBackwardPreprocess.kernel", "n_typed": 12, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashAttentionBackwardPreprocess.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardPreprocess.m_block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardPreprocess.arch", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardPreprocess.head_dim_padded", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardPreprocess.check_hdim_oob", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardPreprocess.num_threads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 41, "n_typed": 27, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 30, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.vllm_flash_attn.cute.flash_bwd_preprocess", "names": [ "vllm.vllm_flash_attn.cute.flash_bwd_preprocess.FlashAttentionBackwardPreprocess" ], "n_typable": 41, "n_typed": 27, "n_any": 0, "n_untyped": 14, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 30, "n_classes": 1, "n_attrs": 6, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/vllm_flash_attn/cute/flash_bwd_sm100.py", "symbol_reports": [ { "kind": "class", "name": "vllm.vllm_flash_attn.cute.flash_bwd_sm100.FlashAttentionBackwardSm100", "methods": [ { "kind": "function", "name": "FlashAttentionBackwardSm100.__init__", "n_typed": 15, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 }, { "kind": "function", "name": "FlashAttentionBackwardSm100._setup_attributes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashAttentionBackwardSm100._get_tiled_mma", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashAttentionBackwardSm100._setup_smem_layout", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashAttentionBackwardSm100.__call__", "n_typed": 23, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 24, "n_params": 23, "n_function_overloads": 1, "n_function_params": 23 }, { "kind": "function", "name": "FlashAttentionBackwardSm100.kernel", "n_typed": 52, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 54, "n_params": 53, "n_function_overloads": 1, "n_function_params": 53 }, { "kind": "function", "name": "FlashAttentionBackwardSm100.load", "n_typed": 30, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 31, "n_params": 30, "n_function_overloads": 1, "n_function_params": 30 }, { "kind": "function", "name": "FlashAttentionBackwardSm100.mma", "n_typed": 32, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 33, "n_params": 32, "n_function_overloads": 1, "n_function_params": 32 }, { "kind": "function", "name": "FlashAttentionBackwardSm100.split_wg", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "FlashAttentionBackwardSm100.apply_score_mod", "n_typed": 0, "n_any": 0, "n_untyped": 12, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "FlashAttentionBackwardSm100.apply_score_mod_bwd", "n_typed": 0, "n_any": 0, "n_untyped": 10, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "FlashAttentionBackwardSm100.compute_loop", "n_typed": 36, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 38, "n_params": 37, "n_function_overloads": 1, "n_function_params": 37 }, { "kind": "function", "name": "FlashAttentionBackwardSm100.dQacc_reduce", "n_typed": 10, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "FlashAttentionBackwardSm100.epilogue_dKV", "n_typed": 14, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 }, { "kind": "function", "name": "FlashAttentionBackwardSm100.epilogue_dK_or_dV_tma", "n_typed": 16, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 17, "n_params": 16, "n_function_overloads": 1, "n_function_params": 16 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashAttentionBackwardSm100.arch", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.tile_hdim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.same_hdim_kv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.tile_hdimv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.check_hdim_oob", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.check_hdim_v_oob", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.tile_m", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.tile_n", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.cta_tiler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.mma_tiler_kq", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.mma_tiler_vdo", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.mma_tiler_pdo", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.mma_tiler_dsq", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.mma_tiler_dsk", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.acc_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.cluster_shape_mn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.is_persistent", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.is_causal", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.is_local", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.qhead_per_kvhead", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.pack_gqa", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.deterministic", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.score_mod", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.score_mod_bwd", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.mask_mod", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.has_aux_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.subtile_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.qk_acc_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.shuffle_LSE", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.shuffle_dPsum", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.use_smem_dS_for_mma_dK", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.reduce_warp_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.compute_warp_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.mma_warp_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.load_warp_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.epi_warp_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.empty_warp_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.threads_per_cta", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.compute_sync_barrier", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.reduce_sync_barrier", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.tmem_alloc_cols", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.tmem_S_offset", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.tmem_P_offset", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.tmem_dV_offset", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.tmem_dP_offset", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.tmem_dQ_offset", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.tmem_dK_offset", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.tmem_dS_offset", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.num_regs_other", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.num_regs_empty", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.buffer_align_bytes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.vec_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.num_regs_reduce", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm100.num_regs_compute", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 322, "n_typed": 232, "n_any": 0, "n_untyped": 90, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 254, "n_attrs": 54, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.vllm_flash_attn.cute.flash_bwd_sm100", "names": [ "vllm.vllm_flash_attn.cute.flash_bwd_sm100.FlashAttentionBackwardSm100" ], "n_typable": 322, "n_typed": 232, "n_any": 0, "n_untyped": 90, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 254, "n_classes": 1, "n_attrs": 54, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/vllm_flash_attn/cute/flash_bwd_sm90.py", "symbol_reports": [ { "kind": "class", "name": "vllm.vllm_flash_attn.cute.flash_bwd_sm90.FlashAttentionBackwardSm90", "methods": [ { "kind": "function", "name": "FlashAttentionBackwardSm90.__init__", "n_typed": 23, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 24, "n_params": 23, "n_function_overloads": 1, "n_function_params": 23 }, { "kind": "function", "name": "FlashAttentionBackwardSm90.can_implement", "n_typed": 1, "n_any": 0, "n_untyped": 8, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "FlashAttentionBackwardSm90._check_type", "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "FlashAttentionBackwardSm90._setup_attributes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashAttentionBackwardSm90._get_tiled_mma", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashAttentionBackwardSm90._get_shared_storage_cls", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashAttentionBackwardSm90.__call__", "n_typed": 23, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 24, "n_params": 23, "n_function_overloads": 1, "n_function_params": 23 }, { "kind": "function", "name": "FlashAttentionBackwardSm90.kernel", "n_typed": 34, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 38, "n_params": 37, "n_function_overloads": 1, "n_function_params": 37 }, { "kind": "function", "name": "FlashAttentionBackwardSm90.load", "n_typed": 23, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 24, "n_params": 23, "n_function_overloads": 1, "n_function_params": 23 }, { "kind": "function", "name": "FlashAttentionBackwardSm90.apply_score_mod", "n_typed": 3, "n_any": 0, "n_untyped": 8, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "FlashAttentionBackwardSm90.apply_score_mod_bwd", "n_typed": 4, "n_any": 0, "n_untyped": 8, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "FlashAttentionBackwardSm90.mma", "n_typed": 33, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 35, "n_params": 34, "n_function_overloads": 1, "n_function_params": 34 }, { "kind": "function", "name": "FlashAttentionBackwardSm90.mma_one_m_block", "n_typed": 24, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 25, "n_params": 24, "n_function_overloads": 1, "n_function_params": 24 }, { "kind": "function", "name": "FlashAttentionBackwardSm90.epilogue_dKV", "n_typed": 18, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 19, "n_params": 18, "n_function_overloads": 1, "n_function_params": 18 }, { "kind": "function", "name": "FlashAttentionBackwardSm90.dQaccum_store", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashAttentionBackwardSm90.arch", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashAttentionBackwardSm90.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm90.tile_hdim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm90.same_hdim_kv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm90.tile_hdimv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm90.check_hdim_oob", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm90.check_hdim_v_oob", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm90.qhead_per_kvhead", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm90.is_causal", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm90.is_local", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm90.tile_m", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm90.tile_n", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm90.num_threads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm90.Q_stage", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm90.dO_stage", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm90.PdS_stage", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm90.SdP_swapAB", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm90.dKV_swapAB", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm90.dQ_swapAB", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm90.AtomLayoutMSdP", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm90.AtomLayoutNdKV", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm90.AtomLayoutMdQ", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm90.num_mma_warp_groups", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm90.mma_dkv_is_rs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm90.V_in_regs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm90.shuffle_LSE", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm90.shuffle_dPsum", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm90.score_mod", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm90.score_mod_bwd", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm90.mask_mod", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm90.has_aux_tensors", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm90.subtile_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm90.qk_acc_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionBackwardSm90.vec_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 274, "n_typed": 202, "n_any": 0, "n_untyped": 72, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 226, "n_attrs": 34, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.vllm_flash_attn.cute.flash_bwd_sm90", "names": [ "vllm.vllm_flash_attn.cute.flash_bwd_sm90.FlashAttentionBackwardSm90" ], "n_typable": 274, "n_typed": 202, "n_any": 0, "n_untyped": 72, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 15, "n_method_overloads": 15, "n_method_params": 226, "n_classes": 1, "n_attrs": 34, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/vllm_flash_attn/cute/flash_fwd.py", "symbol_reports": [ { "kind": "class", "name": "vllm.vllm_flash_attn.cute.flash_fwd.FlashAttentionForwardSm80", "methods": [ { "kind": "function", "name": "FlashAttentionForwardSm80._get_smem_layout_atom", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashAttentionForwardSm80._get_tiled_mma", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashAttentionForwardSm80._get_shared_storage_cls", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashAttentionForwardSm80.__call__", "n_typed": 10, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "FlashAttentionForwardSm80.kernel", "n_typed": 21, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 24, "n_params": 23, "n_function_overloads": 1, "n_function_params": 23 }, { "kind": "function", "name": "FlashAttentionForwardSm80.compute_one_n_block", "n_typed": 16, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 19, "n_params": 18, "n_function_overloads": 1, "n_function_params": 18 } ], "properties": [], "attrs": [], "n_typable": 58, "n_typed": 47, "n_any": 0, "n_untyped": 11, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 52, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.vllm_flash_attn.cute.flash_fwd.FlashAttentionForwardBase", "methods": [ { "kind": "function", "name": "FlashAttentionForwardBase.__init__", "n_typed": 16, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 17, "n_params": 16, "n_function_overloads": 1, "n_function_params": 16 }, { "kind": "function", "name": "FlashAttentionForwardBase.can_implement", "n_typed": 1, "n_any": 0, "n_untyped": 9, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "FlashAttentionForwardBase._check_type", "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "FlashAttentionForwardBase._setup_attributes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashAttentionForwardBase._get_smem_layout_atom", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashAttentionForwardBase._get_tiled_mma", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashAttentionForwardBase._get_shared_storage_cls", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashAttentionForwardBase.__call__", "n_typed": 7, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "FlashAttentionForwardBase.epilogue", "n_typed": 13, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 14, "n_params": 13, "n_function_overloads": 1, "n_function_params": 13 }, { "kind": "function", "name": "FlashAttentionForwardBase.advance_pipeline", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlashAttentionForwardBase.load_Q", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "FlashAttentionForwardBase.load_K", "n_typed": 10, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "FlashAttentionForwardBase.load_V", "n_typed": 10, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashAttentionForwardBase.arch", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardBase.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardBase.tile_hdim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardBase.same_hdim_kv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardBase.tile_hdimv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardBase.check_hdim_oob", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardBase.check_hdim_v_oob", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardBase.qhead_per_kvhead", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardBase.is_causal", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardBase.is_local", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardBase.pack_gqa", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardBase.tile_m", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardBase.tile_n", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardBase.num_threads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardBase.num_stages", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardBase.q_subtile_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardBase.Q_in_regs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardBase.score_mod", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardBase.mask_mod", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardBase.qk_acc_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardBase.vec_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "n_typable": 115, "n_typed": 74, "n_any": 0, "n_untyped": 41, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 81, "n_attrs": 21, "n_properties": 0 }, { "kind": "class", "name": "vllm.vllm_flash_attn.cute.flash_fwd.FlashAttentionForwardSm90", "methods": [ { "kind": "function", "name": "FlashAttentionForwardSm90.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FlashAttentionForwardSm90._get_smem_layout_atom", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashAttentionForwardSm90._get_tiled_mma", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashAttentionForwardSm90._get_shared_storage_cls", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashAttentionForwardSm90.__call__", "n_typed": 17, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 18, "n_params": 17, "n_function_overloads": 1, "n_function_params": 17 }, { "kind": "function", "name": "FlashAttentionForwardSm90.kernel", "n_typed": 33, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 36, "n_params": 35, "n_function_overloads": 1, "n_function_params": 35 }, { "kind": "function", "name": "FlashAttentionForwardSm90.load", "n_typed": 16, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 17, "n_params": 16, "n_function_overloads": 1, "n_function_params": 16 }, { "kind": "function", "name": "FlashAttentionForwardSm90.mma", "n_typed": 26, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 28, "n_params": 27, "n_function_overloads": 1, "n_function_params": 27 }, { "kind": "function", "name": "FlashAttentionForwardSm90.first_half_block_overlap", "n_typed": 9, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "FlashAttentionForwardSm90.last_half_block_overlap", "n_typed": 2, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FlashAttentionForwardSm90.mma_one_n_block", "n_typed": 15, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 }, { "kind": "function", "name": "FlashAttentionForwardSm90.mma_one_n_block_intrawg_overlap", "n_typed": 14, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 15, "n_params": 14, "n_function_overloads": 1, "n_function_params": 14 }, { "kind": "function", "name": "FlashAttentionForwardSm90.mma_init", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashAttentionForwardSm90.apply_score_mod", "n_typed": 1, "n_any": 0, "n_untyped": 10, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "FlashAttentionForwardSm90.warp_scheduler_barrier_sync", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashAttentionForwardSm90.warp_scheduler_barrier_arrive", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashAttentionForwardSm90.arch", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashAttentionForwardSm90.intra_wg_overlap", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm90.mma_pv_is_rs", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm90.buffer_align_bytes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 172, "n_typed": 135, "n_any": 0, "n_untyped": 37, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 16, "n_method_overloads": 16, "n_method_params": 153, "n_attrs": 4, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.vllm_flash_attn.cute.flash_fwd", "names": [ "vllm.vllm_flash_attn.cute.flash_fwd.FlashAttentionForwardBase", "vllm.vllm_flash_attn.cute.flash_fwd.FlashAttentionForwardSm80", "vllm.vllm_flash_attn.cute.flash_fwd.FlashAttentionForwardSm90" ], "n_typable": 345, "n_typed": 256, "n_any": 0, "n_untyped": 89, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 35, "n_method_overloads": 35, "n_method_params": 286, "n_classes": 3, "n_attrs": 25, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/vllm_flash_attn/cute/flash_fwd_combine.py", "symbol_reports": [ { "kind": "class", "name": "vllm.vllm_flash_attn.cute.flash_fwd_combine.FlashAttentionForwardCombine", "methods": [ { "kind": "function", "name": "FlashAttentionForwardCombine.__init__", "n_typed": 8, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "FlashAttentionForwardCombine.can_implement", "n_typed": 1, "n_any": 0, "n_untyped": 7, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "function", "name": "FlashAttentionForwardCombine._setup_attributes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashAttentionForwardCombine.__call__", "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "FlashAttentionForwardCombine.kernel", "n_typed": 18, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 19, "n_params": 18, "n_function_overloads": 1, "n_function_params": 18 }, { "kind": "function", "name": "FlashAttentionForwardCombine.load_O_partial", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashAttentionForwardCombine.dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardCombine.dtype_partial", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardCombine.head_dim", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardCombine.m_block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardCombine.k_block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardCombine.max_splits", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardCombine.num_threads", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardCombine.is_even_k", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardCombine.stages", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 66, "n_typed": 46, "n_any": 0, "n_untyped": 20, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 51, "n_attrs": 9, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.vllm_flash_attn.cute.flash_fwd_combine", "names": [ "vllm.vllm_flash_attn.cute.flash_fwd_combine.FlashAttentionForwardCombine" ], "n_typable": 66, "n_typed": 46, "n_any": 0, "n_untyped": 20, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 51, "n_classes": 1, "n_attrs": 9, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/vllm_flash_attn/cute/flash_fwd_sm100.py", "symbol_reports": [ { "kind": "class", "name": "vllm.vllm_flash_attn.cute.flash_fwd_sm100.FlashAttentionForwardSm100", "methods": [ { "kind": "function", "name": "FlashAttentionForwardSm100.__init__", "n_typed": 17, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 18, "n_params": 17, "n_function_overloads": 1, "n_function_params": 17 }, { "kind": "function", "name": "FlashAttentionForwardSm100._setup_attributes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "FlashAttentionForwardSm100.__call__", "n_typed": 17, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 18, "n_params": 17, "n_function_overloads": 1, "n_function_params": 17 }, { "kind": "function", "name": "FlashAttentionForwardSm100.kernel", "n_typed": 31, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 34, "n_params": 33, "n_function_overloads": 1, "n_function_params": 33 }, { "kind": "function", "name": "FlashAttentionForwardSm100.load", "n_typed": 19, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 20, "n_params": 19, "n_function_overloads": 1, "n_function_params": 19 }, { "kind": "function", "name": "FlashAttentionForwardSm100.mma", "n_typed": 15, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 }, { "kind": "function", "name": "FlashAttentionForwardSm100.softmax_loop", "n_typed": 16, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 19, "n_params": 18, "n_function_overloads": 1, "n_function_params": 18 }, { "kind": "function", "name": "FlashAttentionForwardSm100.softmax_step", "n_typed": 23, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 26, "n_params": 25, "n_function_overloads": 1, "n_function_params": 25 }, { "kind": "function", "name": "FlashAttentionForwardSm100.correction_loop", "n_typed": 18, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 19, "n_params": 18, "n_function_overloads": 1, "n_function_params": 18 }, { "kind": "function", "name": "FlashAttentionForwardSm100.correction_rescale", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "FlashAttentionForwardSm100.correction_epilogue", "n_typed": 11, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "FlashAttentionForwardSm100.epilogue_s2g", "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "FlashAttentionForwardSm100.load_Q", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "FlashAttentionForwardSm100.load_KV", "n_typed": 11, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 12, "n_params": 11, "n_function_overloads": 1, "n_function_params": 11 }, { "kind": "function", "name": "FlashAttentionForwardSm100.offset_kv_smem", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "FlashAttentionForwardSm100.make_and_init_load_kv_pipeline", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "FlashAttentionForwardSm100.apply_score_mod", "n_typed": 1, "n_any": 0, "n_untyped": 12, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "FlashAttentionForwardSm100.arch", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.use_tma_KV", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.head_dim_padded", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.same_hdim_kv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.head_dim_v_padded", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.same_hdim_kv_padded", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.check_hdim_oob", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.check_hdim_v_oob", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.m_block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.n_block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.q_stage", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.cta_tiler", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.mma_tiler_qk", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.mma_tiler_pv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.qk_acc_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.pv_acc_dtype", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.cluster_shape_mn", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.is_persistent", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.is_causal", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.is_local", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.is_varlen_q", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.use_correction_warps_for_epi", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.qhead_per_kvhead", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.is_split_kv", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.pack_gqa", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.q_subtile_factor", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.score_mod", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.mask_mod", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.s0_s1_barrier", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.overlap_sO_sQ", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.softmax0_warp_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.softmax1_warp_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.correction_warp_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.mma_warp_id", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.epilogue_warp_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.load_warp_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.empty_warp_ids", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.tmem_alloc_cols", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.threads_per_cta", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.tmem_s_offset", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.tmem_o_offset", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.tmem_total", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.tmem_s_to_p_offset", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.tmem_p_offset", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.tmem_vec_offset", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.num_regs_empty", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.buffer_align_bytes", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.vec_size", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.num_regs_softmax", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.num_regs_correction", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "FlashAttentionForwardSm100.num_regs_other", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 286, "n_typed": 202, "n_any": 0, "n_untyped": 84, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 17, "n_method_overloads": 17, "n_method_params": 219, "n_attrs": 51, "n_properties": 0 }, { "kind": "class", "name": "vllm.vllm_flash_attn.cute.flash_fwd_sm100.NamedBarrierFwd", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "NamedBarrierFwd.Epilogue", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.vllm_flash_attn.cute.flash_fwd_sm100", "names": [ "vllm.vllm_flash_attn.cute.flash_fwd_sm100.FlashAttentionForwardSm100", "vllm.vllm_flash_attn.cute.flash_fwd_sm100.NamedBarrierFwd" ], "n_typable": 286, "n_typed": 202, "n_any": 0, "n_untyped": 84, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 17, "n_method_overloads": 17, "n_method_params": 219, "n_classes": 2, "n_attrs": 52, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/vllm_flash_attn/cute/hopper_helpers.py", "symbol_reports": [ { "kind": "function", "name": "vllm.vllm_flash_attn.cute.hopper_helpers.gemm_w_idx", "n_typed": 10, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.hopper_helpers.gemm_zero_init", "n_typed": 9, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.hopper_helpers.make_smem_layout", "n_typed": 5, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.hopper_helpers.gemm", "n_typed": 8, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 } ], "type_ignores": [], "name": "vllm.vllm_flash_attn.cute.hopper_helpers", "names": [ "vllm.vllm_flash_attn.cute.hopper_helpers.gemm", "vllm.vllm_flash_attn.cute.hopper_helpers.gemm_w_idx", "vllm.vllm_flash_attn.cute.hopper_helpers.gemm_zero_init", "vllm.vllm_flash_attn.cute.hopper_helpers.make_smem_layout" ], "n_typable": 34, "n_typed": 32, "n_any": 0, "n_untyped": 2, "n_functions": 4, "n_function_overloads": 4, "n_function_params": 30, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/vllm_flash_attn/cute/mask.py", "symbol_reports": [ { "kind": "function", "name": "vllm.vllm_flash_attn.cute.mask.mask_r2p", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.mask.mask_r2p_transposed", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "class", "name": "vllm.vllm_flash_attn.cute.mask.AttentionMask", "methods": [ { "kind": "function", "name": "AttentionMask.apply_mask", "n_typed": 12, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 }, { "kind": "function", "name": "AttentionMask.apply_mask_sm100", "n_typed": 14, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 }, { "kind": "function", "name": "AttentionMask.apply_mask_sm100_transposed", "n_typed": 15, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 } ], "properties": [ { "kind": "property", "name": "AttentionMask.seqlen_q", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "AttentionMask.seqlen_k", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [ { "kind": "attr", "name": "AttentionMask.tile_m", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionMask.tile_n", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionMask.seqlen_info", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionMask.window_size_left", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionMask.window_size_right", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionMask.qhead_per_kvhead_packgqa", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "AttentionMask.swap_AB", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 47, "n_typed": 43, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 42, "n_attrs": 7, "n_properties": 2 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.mask.mask_r2p_dual_bound", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [], "name": "vllm.vllm_flash_attn.cute.mask", "names": [ "vllm.vllm_flash_attn.cute.mask.AttentionMask", "vllm.vllm_flash_attn.cute.mask.mask_r2p", "vllm.vllm_flash_attn.cute.mask.mask_r2p_dual_bound", "vllm.vllm_flash_attn.cute.mask.mask_r2p_transposed" ], "n_typable": 60, "n_typed": 56, "n_any": 0, "n_untyped": 4, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 10, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 42, "n_classes": 1, "n_attrs": 7, "n_properties": 2, "n_type_ignores": 0 }, { "path": "vllm/vllm_flash_attn/cute/mma_sm100_desc.py", "symbol_reports": [ { "kind": "class", "name": "vllm.vllm_flash_attn.cute.mma_sm100_desc.CFormat", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "CFormat.F16", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CFormat.F32", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "CFormat.S32", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.mma_sm100_desc.make_smem_desc_base", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.mma_sm100_desc.to_C_format", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.vllm_flash_attn.cute.mma_sm100_desc.S8Format", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "S8Format.UINT8", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "S8Format.INT8", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.mma_sm100_desc.make_smem_desc_start_addr", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.mma_sm100_desc.mma_op_to_idesc", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.vllm_flash_attn.cute.mma_sm100_desc.F16F32Format", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "F16F32Format.F16", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "F16F32Format.BF16", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "F16F32Format.TF32", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 3, "n_properties": 0 }, { "kind": "class", "name": "vllm.vllm_flash_attn.cute.mma_sm100_desc.Major", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Major.K", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Major.MN", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.mma_sm100_desc.to_UMMA_format", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "class", "name": "vllm.vllm_flash_attn.cute.mma_sm100_desc.Saturate", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "Saturate.False_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Saturate.True_", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.vllm_flash_attn.cute.mma_sm100_desc.MXF8F6F4Format", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "MXF8F6F4Format.E4M3", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MXF8F6F4Format.E5M2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MXF8F6F4Format.E2M3", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MXF8F6F4Format.E3M2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MXF8F6F4Format.E2M1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 5, "n_properties": 0 }, { "kind": "class", "name": "vllm.vllm_flash_attn.cute.mma_sm100_desc.ScaleIn", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "ScaleIn.One", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "ScaleIn.Neg", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 2, "n_properties": 0 }, { "kind": "class", "name": "vllm.vllm_flash_attn.cute.mma_sm100_desc.MaxShift", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "MaxShift.NoShift", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MaxShift.MaxShift8", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MaxShift.MaxShift16", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "MaxShift.MaxShift32", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.mma_sm100_desc.make_instr_desc", "n_typed": 10, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 13, "n_params": 12, "n_function_overloads": 1, "n_function_params": 12 }, { "kind": "class", "name": "vllm.vllm_flash_attn.cute.mma_sm100_desc.LayoutType", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "LayoutType.SWIZZLE_NONE", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LayoutType.SWIZZLE_128B_BASE32B", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LayoutType.SWIZZLE_128B", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LayoutType.SWIZZLE_64B", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "LayoutType.SWIZZLE_32B", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 5, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.vllm_flash_attn.cute.mma_sm100_desc", "names": [ "vllm.vllm_flash_attn.cute.mma_sm100_desc.CFormat", "vllm.vllm_flash_attn.cute.mma_sm100_desc.F16F32Format", "vllm.vllm_flash_attn.cute.mma_sm100_desc.LayoutType", "vllm.vllm_flash_attn.cute.mma_sm100_desc.MXF8F6F4Format", "vllm.vllm_flash_attn.cute.mma_sm100_desc.Major", "vllm.vllm_flash_attn.cute.mma_sm100_desc.MaxShift", "vllm.vllm_flash_attn.cute.mma_sm100_desc.S8Format", "vllm.vllm_flash_attn.cute.mma_sm100_desc.Saturate", "vllm.vllm_flash_attn.cute.mma_sm100_desc.ScaleIn", "vllm.vllm_flash_attn.cute.mma_sm100_desc.make_instr_desc", "vllm.vllm_flash_attn.cute.mma_sm100_desc.make_smem_desc_base", "vllm.vllm_flash_attn.cute.mma_sm100_desc.make_smem_desc_start_addr", "vllm.vllm_flash_attn.cute.mma_sm100_desc.mma_op_to_idesc", "vllm.vllm_flash_attn.cute.mma_sm100_desc.to_C_format", "vllm.vllm_flash_attn.cute.mma_sm100_desc.to_UMMA_format" ], "n_typable": 25, "n_typed": 19, "n_any": 0, "n_untyped": 6, "n_functions": 6, "n_function_overloads": 6, "n_function_params": 19, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 9, "n_attrs": 28, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/vllm_flash_attn/cute/named_barrier.py", "symbol_reports": [ { "kind": "class", "name": "vllm.vllm_flash_attn.cute.named_barrier.NamedBarrierBwd", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "NamedBarrierBwd.Epilogue", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NamedBarrierBwd.WarpSchedulerWG1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NamedBarrierBwd.WarpSchedulerWG2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NamedBarrierBwd.WarpSchedulerWG3", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NamedBarrierBwd.PdS", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NamedBarrierBwd.dQFullWG0", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NamedBarrierBwd.dQFullWG1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NamedBarrierBwd.dQEmptyWG0", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NamedBarrierBwd.dQEmptyWG1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 9, "n_properties": 0 }, { "kind": "class", "name": "vllm.vllm_flash_attn.cute.named_barrier.NamedBarrierBwdSm100", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "NamedBarrierBwdSm100.EpilogueWG1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NamedBarrierBwdSm100.EpilogueWG2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NamedBarrierBwdSm100.Compute", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NamedBarrierBwdSm100.dQaccReduce", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 4, "n_properties": 0 }, { "kind": "class", "name": "vllm.vllm_flash_attn.cute.named_barrier.NamedBarrierFwd", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "NamedBarrierFwd.Epilogue", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NamedBarrierFwd.WarpSchedulerWG1", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NamedBarrierFwd.WarpSchedulerWG2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NamedBarrierFwd.WarpSchedulerWG3", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NamedBarrierFwd.PFull", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "NamedBarrierFwd.PEmpty", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 6, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.vllm_flash_attn.cute.named_barrier", "names": [ "vllm.vllm_flash_attn.cute.named_barrier.NamedBarrierBwd", "vllm.vllm_flash_attn.cute.named_barrier.NamedBarrierBwdSm100", "vllm.vllm_flash_attn.cute.named_barrier.NamedBarrierFwd" ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 3, "n_attrs": 19, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/vllm_flash_attn/cute/pack_gqa.py", "symbol_reports": [ { "kind": "class", "name": "vllm.vllm_flash_attn.cute.pack_gqa.PackGQA", "methods": [ { "kind": "function", "name": "PackGQA.__init__", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "PackGQA.compute_ptr", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "PackGQA.load_Q", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "PackGQA.store_LSE", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "PackGQA.store_O", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PackGQA.m_block_size", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PackGQA.head_dim_padded", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PackGQA.check_hdim_oob", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 }, { "kind": "attr", "name": "PackGQA.qhead_per_kvhead", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 37, "n_typed": 28, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 28, "n_attrs": 4, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.vllm_flash_attn.cute.pack_gqa", "names": [ "vllm.vllm_flash_attn.cute.pack_gqa.PackGQA" ], "n_typable": 37, "n_typed": 28, "n_any": 0, "n_untyped": 9, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 28, "n_classes": 1, "n_attrs": 4, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/vllm_flash_attn/cute/paged_kv.py", "symbol_reports": [ { "kind": "class", "name": "vllm.vllm_flash_attn.cute.paged_kv.PagedKVManager", "methods": [ { "kind": "function", "name": "PagedKVManager.create", "n_typed": 14, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 15, "n_params": 14, "n_function_overloads": 1, "n_function_params": 14 }, { "kind": "function", "name": "PagedKVManager.load_page_table", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PagedKVManager.compute_X_ptr", "n_typed": 1, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "PagedKVManager.load_KV", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "PagedKVManager.mPageTable", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PagedKVManager.mK_paged", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PagedKVManager.mV_paged", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PagedKVManager.thread_idx", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PagedKVManager.page_size_divmod", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PagedKVManager.seqlen_k", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PagedKVManager.leftpad_k", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PagedKVManager.n_block_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PagedKVManager.num_threads", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PagedKVManager.head_dim_padded", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PagedKVManager.head_dim_v_padded", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PagedKVManager.gmem_threads_per_row", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PagedKVManager.page_entry_per_thread", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PagedKVManager.async_copy_elems", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PagedKVManager.gmem_tiled_copy_KV", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PagedKVManager.gmem_thr_copy_KV", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PagedKVManager.tPrPage", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PagedKVManager.tPrPageOffset", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PagedKVManager.tKpK", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "PagedKVManager.tVpV", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 23, "n_typed": 19, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 19, "n_attrs": 20, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.vllm_flash_attn.cute.paged_kv", "names": [ "vllm.vllm_flash_attn.cute.paged_kv.PagedKVManager" ], "n_typable": 23, "n_typed": 19, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 19, "n_classes": 1, "n_attrs": 20, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/vllm_flash_attn/cute/pipeline.py", "symbol_reports": [ { "kind": "function", "name": "vllm.vllm_flash_attn.cute.pipeline.make_pipeline_state", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "class", "name": "vllm.vllm_flash_attn.cute.pipeline.PipelineStateSimple", "methods": [ { "kind": "function", "name": "PipelineStateSimple.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PipelineStateSimple.clone", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PipelineStateSimple.advance", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PipelineStateSimple.__extract_mlir_values__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "PipelineStateSimple.__new_from_mlir_values__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [ { "kind": "property", "name": "PipelineStateSimple.stages", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "PipelineStateSimple.index", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 }, { "kind": "property", "name": "PipelineStateSimple.phase", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_typable": 1 } ], "attrs": [], "n_typable": 11, "n_typed": 6, "n_any": 0, "n_untyped": 5, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 5, "n_method_overloads": 5, "n_method_params": 3, "n_attrs": 0, "n_properties": 3 }, { "kind": "class", "name": "vllm.vllm_flash_attn.cute.pipeline.PipelineTmaUmma", "methods": [ { "kind": "function", "name": "PipelineTmaUmma.create", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PipelineTmaUmma.producer_acquire", "n_typed": 3, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 3, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.vllm_flash_attn.cute.pipeline.PipelineTmaAsync", "methods": [ { "kind": "function", "name": "PipelineTmaAsync.create", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "PipelineTmaAsync.producer_acquire", "n_typed": 3, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 } ], "properties": [], "attrs": [], "n_typable": 9, "n_typed": 3, "n_any": 0, "n_untyped": 6, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 7, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.vllm_flash_attn.cute.pipeline", "names": [ "vllm.vllm_flash_attn.cute.pipeline.PipelineStateSimple", "vllm.vllm_flash_attn.cute.pipeline.PipelineTmaAsync", "vllm.vllm_flash_attn.cute.pipeline.PipelineTmaUmma", "vllm.vllm_flash_attn.cute.pipeline.make_pipeline_state" ], "n_typable": 32, "n_typed": 14, "n_any": 0, "n_untyped": 18, "n_functions": 1, "n_function_overloads": 1, "n_function_params": 2, "n_methods": 9, "n_method_overloads": 9, "n_method_params": 17, "n_classes": 3, "n_attrs": 0, "n_properties": 3, "n_type_ignores": 0 }, { "path": "vllm/vllm_flash_attn/cute/seqlen_info.py", "symbol_reports": [ { "kind": "class", "name": "vllm.vllm_flash_attn.cute.seqlen_info.SeqlenInfoQK", "methods": [ { "kind": "function", "name": "SeqlenInfoQK.create", "n_typed": 9, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 10, "n_params": 9, "n_function_overloads": 1, "n_function_params": 9 }, { "kind": "function", "name": "SeqlenInfoQK.offset_batch_Q", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "SeqlenInfoQK.offset_batch_K", "n_typed": 5, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SeqlenInfoQK.offset_q", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SeqlenInfoQK.offset_k", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SeqlenInfoQK.padded_offset_q", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SeqlenInfoQK.padded_offset_k", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SeqlenInfoQK.seqlen_q", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SeqlenInfoQK.seqlen_k", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SeqlenInfoQK.has_cu_seqlens_q", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SeqlenInfoQK.has_cu_seqlens_k", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SeqlenInfoQK.has_seqused_q", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SeqlenInfoQK.has_seqused_k", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 20, "n_typed": 19, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 3, "n_method_overloads": 3, "n_method_params": 17, "n_attrs": 10, "n_properties": 0 }, { "kind": "class", "name": "vllm.vllm_flash_attn.cute.seqlen_info.SeqlenInfo", "methods": [ { "kind": "function", "name": "SeqlenInfo.create", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SeqlenInfo.offset", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "SeqlenInfo.seqlen", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 5, "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 4, "n_attrs": 2, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.vllm_flash_attn.cute.seqlen_info", "names": [ "vllm.vllm_flash_attn.cute.seqlen_info.SeqlenInfo", "vllm.vllm_flash_attn.cute.seqlen_info.SeqlenInfoQK" ], "n_typable": 25, "n_typed": 23, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 21, "n_classes": 2, "n_attrs": 12, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/vllm_flash_attn/cute/softmax.py", "symbol_reports": [ { "kind": "class", "name": "vllm.vllm_flash_attn.cute.softmax.Softmax", "methods": [ { "kind": "function", "name": "Softmax.create", "n_typed": 4, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "Softmax.reset", "n_typed": 1, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "Softmax._compute_row_max", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Softmax._compute_row_sum", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Softmax.online_softmax", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "Softmax.finalize", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "Softmax.rescale_O", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Softmax.scale_log2", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Softmax.num_rows", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Softmax.row_max", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Softmax.row_sum", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Softmax.arch", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Softmax.softmax_scale", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 22, "n_typed": 21, "n_any": 0, "n_untyped": 1, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 7, "n_method_overloads": 7, "n_method_params": 15, "n_attrs": 6, "n_properties": 0 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.softmax.apply_score_mod_bwd_inner", "n_typed": 6, "n_any": 0, "n_untyped": 10, "n_overloads": 1, "n_typable": 16, "n_params": 15, "n_function_overloads": 1, "n_function_params": 15 }, { "kind": "class", "name": "vllm.vllm_flash_attn.cute.softmax.SoftmaxSm100", "methods": [ { "kind": "function", "name": "SoftmaxSm100.create", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SoftmaxSm100.update_row_max", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SoftmaxSm100.update_row_sum", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SoftmaxSm100.scale_subtract_rowmax", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SoftmaxSm100.apply_exp2_convert", "n_typed": 6, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 7, "n_params": 6, "n_function_overloads": 1, "n_function_params": 6 }, { "kind": "function", "name": "SoftmaxSm100.scale_apply_exp2_convert", "n_typed": 3, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SoftmaxSm100.rescale_threshold", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 25, "n_typed": 21, "n_any": 0, "n_untyped": 4, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 6, "n_method_overloads": 6, "n_method_params": 19, "n_attrs": 1, "n_properties": 0 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.softmax.apply_score_mod_inner", "n_typed": 7, "n_any": 0, "n_untyped": 8, "n_overloads": 1, "n_typable": 15, "n_params": 14, "n_function_overloads": 1, "n_function_params": 14 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.softmax.floor_if_packed", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "type_ignores": [], "name": "vllm.vllm_flash_attn.cute.softmax", "names": [ "vllm.vllm_flash_attn.cute.softmax.Softmax", "vllm.vllm_flash_attn.cute.softmax.SoftmaxSm100", "vllm.vllm_flash_attn.cute.softmax.apply_score_mod_bwd_inner", "vllm.vllm_flash_attn.cute.softmax.apply_score_mod_inner", "vllm.vllm_flash_attn.cute.softmax.floor_if_packed" ], "n_typable": 81, "n_typed": 57, "n_any": 0, "n_untyped": 24, "n_functions": 3, "n_function_overloads": 3, "n_function_params": 31, "n_methods": 13, "n_method_overloads": 13, "n_method_params": 34, "n_classes": 2, "n_attrs": 7, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/vllm_flash_attn/cute/testing.py", "symbol_reports": [ { "kind": "class", "name": "vllm.vllm_flash_attn.cute.testing.IndexFirstAxis", "methods": [ { "kind": "function", "name": "IndexFirstAxis.forward", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "IndexFirstAxis.backward", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 7, "n_typed": 0, "n_any": 0, "n_untyped": 7, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 5, "n_attrs": 0, "n_properties": 0 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.testing.construct_local_mask", "n_typed": 0, "n_any": 0, "n_untyped": 9, "n_overloads": 1, "n_typable": 9, "n_params": 8, "n_function_overloads": 1, "n_function_params": 8 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.testing.unpad_input", "n_typed": 0, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.testing.generate_qkv", "n_typed": 0, "n_any": 0, "n_untyped": 11, "n_overloads": 1, "n_typable": 11, "n_params": 10, "n_function_overloads": 1, "n_function_params": 10 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.testing.pad_input", "n_typed": 0, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.testing.attention_ref", "n_typed": 1, "n_any": 0, "n_untyped": 22, "n_overloads": 1, "n_typable": 23, "n_params": 22, "n_function_overloads": 1, "n_function_params": 22 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.testing.generate_random_padding_mask", "n_typed": 0, "n_any": 0, "n_untyped": 6, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.testing.construct_chunk_mask", "n_typed": 0, "n_any": 0, "n_untyped": 8, "n_overloads": 1, "n_typable": 8, "n_params": 7, "n_function_overloads": 1, "n_function_params": 7 }, { "kind": "class", "name": "vllm.vllm_flash_attn.cute.testing.IndexPutFirstAxis", "methods": [ { "kind": "function", "name": "IndexPutFirstAxis.forward", "n_typed": 0, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "IndexPutFirstAxis.backward", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 } ], "properties": [], "attrs": [], "n_typable": 8, "n_typed": 0, "n_any": 0, "n_untyped": 8, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 6, "n_attrs": 0, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.vllm_flash_attn.cute.testing", "names": [ "vllm.vllm_flash_attn.cute.testing.IndexFirstAxis", "vllm.vllm_flash_attn.cute.testing.IndexPutFirstAxis", "vllm.vllm_flash_attn.cute.testing.attention_ref", "vllm.vllm_flash_attn.cute.testing.construct_chunk_mask", "vllm.vllm_flash_attn.cute.testing.construct_local_mask", "vllm.vllm_flash_attn.cute.testing.generate_qkv", "vllm.vllm_flash_attn.cute.testing.generate_random_padding_mask", "vllm.vllm_flash_attn.cute.testing.pad_input", "vllm.vllm_flash_attn.cute.testing.unpad_input" ], "n_typable": 81, "n_typed": 1, "n_any": 0, "n_untyped": 80, "n_functions": 7, "n_function_overloads": 7, "n_function_params": 59, "n_methods": 4, "n_method_overloads": 4, "n_method_params": 11, "n_classes": 2, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/vllm_flash_attn/cute/tile_scheduler.py", "symbol_reports": [ { "kind": "class", "name": "vllm.vllm_flash_attn.cute.tile_scheduler.SingleTileLPTScheduler", "methods": [ { "kind": "function", "name": "SingleTileLPTScheduler.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "SingleTileLPTScheduler.to_underlying_arguments", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SingleTileLPTScheduler.create", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SingleTileLPTScheduler.get_grid_shape", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SingleTileLPTScheduler.get_current_work", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SingleTileLPTScheduler.initial_work_tile_info", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SingleTileLPTScheduler.prefetch_next_work", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SingleTileLPTScheduler.advance_to_next_work", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SingleTileLPTScheduler.__extract_mlir_values__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SingleTileLPTScheduler.__new_from_mlir_values__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SingleTileLPTScheduler.params", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 34, "n_typed": 10, "n_any": 0, "n_untyped": 24, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 23, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.vllm_flash_attn.cute.tile_scheduler.ParamsBase", "methods": [ { "kind": "function", "name": "ParamsBase.__extract_mlir_values__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "ParamsBase.__new_from_mlir_values__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 3, "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 2, "n_method_overloads": 2, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.vllm_flash_attn.cute.tile_scheduler.SingleTileScheduler", "methods": [ { "kind": "function", "name": "SingleTileScheduler.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "SingleTileScheduler.to_underlying_arguments", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SingleTileScheduler.create", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SingleTileScheduler.get_grid_shape", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SingleTileScheduler.get_current_work", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SingleTileScheduler.initial_work_tile_info", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SingleTileScheduler.prefetch_next_work", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SingleTileScheduler.advance_to_next_work", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SingleTileScheduler.__extract_mlir_values__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SingleTileScheduler.__new_from_mlir_values__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SingleTileScheduler.params", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 33, "n_typed": 9, "n_any": 0, "n_untyped": 24, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 22, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.vllm_flash_attn.cute.tile_scheduler.WorkTileInfo", "methods": [ { "kind": "function", "name": "WorkTileInfo.__new_from_mlir_values__", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [], "n_typable": 2, "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 1, "n_attrs": 0, "n_properties": 0 }, { "kind": "class", "name": "vllm.vllm_flash_attn.cute.tile_scheduler.TileSchedulerArguments", "methods": [], "properties": [], "attrs": [ { "kind": "attr", "name": "TileSchedulerArguments.num_block", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TileSchedulerArguments.num_head", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TileSchedulerArguments.num_batch", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TileSchedulerArguments.num_splits", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TileSchedulerArguments.seqlen_k", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TileSchedulerArguments.headdim", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TileSchedulerArguments.headdim_v", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TileSchedulerArguments.total_q", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TileSchedulerArguments.tile_shape_mn", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TileSchedulerArguments.cluster_shape_mn", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TileSchedulerArguments.mCuSeqlensQ", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TileSchedulerArguments.mSeqUsedQ", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TileSchedulerArguments.qhead_per_kvhead_packgqa", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TileSchedulerArguments.element_size", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TileSchedulerArguments.is_persistent", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TileSchedulerArguments.lpt", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TileSchedulerArguments.is_split_kv", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "TileSchedulerArguments.head_swizzle", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 0, "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_attrs": 18, "n_properties": 0 }, { "kind": "class", "name": "vllm.vllm_flash_attn.cute.tile_scheduler.SingleTileVarlenScheduler", "methods": [ { "kind": "function", "name": "SingleTileVarlenScheduler.__init__", "n_typed": 3, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "SingleTileVarlenScheduler.to_underlying_arguments", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SingleTileVarlenScheduler.create", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SingleTileVarlenScheduler.get_grid_shape", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SingleTileVarlenScheduler._get_num_m_blocks", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SingleTileVarlenScheduler.get_current_work", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SingleTileVarlenScheduler.initial_work_tile_info", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SingleTileVarlenScheduler.prefetch_next_work", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SingleTileVarlenScheduler.advance_to_next_work", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SingleTileVarlenScheduler.__extract_mlir_values__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SingleTileVarlenScheduler.__new_from_mlir_values__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SingleTileVarlenScheduler.params", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 37, "n_typed": 13, "n_any": 0, "n_untyped": 24, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 11, "n_method_overloads": 11, "n_method_params": 25, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.vllm_flash_attn.cute.tile_scheduler.Params", "methods": [ { "kind": "function", "name": "Params.create", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "Params.num_block", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Params.num_head", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Params.num_batch", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Params.num_splits", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Params.num_splits_divmod", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Params.is_split_kv", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 }, { "kind": "attr", "name": "Params.cluster_shape_mn", "n_typed": 0, "n_any": 0, "n_untyped": 0, "n_typable": 0 } ], "n_typable": 4, "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 1, "n_method_overloads": 1, "n_method_params": 3, "n_attrs": 7, "n_properties": 0 }, { "kind": "class", "name": "vllm.vllm_flash_attn.cute.tile_scheduler.SingleTileLPTBwdScheduler", "methods": [ { "kind": "function", "name": "SingleTileLPTBwdScheduler.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "SingleTileLPTBwdScheduler.to_underlying_arguments", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SingleTileLPTBwdScheduler.create", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SingleTileLPTBwdScheduler.get_grid_shape", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "SingleTileLPTBwdScheduler.get_current_work", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SingleTileLPTBwdScheduler.initial_work_tile_info", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SingleTileLPTBwdScheduler.prefetch_next_work", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SingleTileLPTBwdScheduler.advance_to_next_work", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "SingleTileLPTBwdScheduler.__extract_mlir_values__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "SingleTileLPTBwdScheduler.__new_from_mlir_values__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "SingleTileLPTBwdScheduler.params", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 33, "n_typed": 9, "n_any": 0, "n_untyped": 24, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 22, "n_attrs": 1, "n_properties": 0 }, { "kind": "class", "name": "vllm.vllm_flash_attn.cute.tile_scheduler.StaticPersistentTileScheduler", "methods": [ { "kind": "function", "name": "StaticPersistentTileScheduler.__init__", "n_typed": 2, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "StaticPersistentTileScheduler.to_underlying_arguments", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "StaticPersistentTileScheduler.create", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "StaticPersistentTileScheduler.get_grid_shape", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "StaticPersistentTileScheduler.get_current_work", "n_typed": 1, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StaticPersistentTileScheduler.initial_work_tile_info", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StaticPersistentTileScheduler.prefetch_next_work", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StaticPersistentTileScheduler.advance_to_next_work", "n_typed": 0, "n_any": 0, "n_untyped": 3, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "StaticPersistentTileScheduler.__extract_mlir_values__", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 1, "n_params": 0, "n_function_overloads": 1, "n_function_params": 0 }, { "kind": "function", "name": "StaticPersistentTileScheduler.__new_from_mlir_values__", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 } ], "properties": [], "attrs": [ { "kind": "attr", "name": "StaticPersistentTileScheduler.params", "n_typed": 0, "n_any": 0, "n_untyped": 1, "n_typable": 1 } ], "n_typable": 33, "n_typed": 9, "n_any": 0, "n_untyped": 24, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 10, "n_method_overloads": 10, "n_method_params": 22, "n_attrs": 1, "n_properties": 0 } ], "type_ignores": [], "name": "vllm.vllm_flash_attn.cute.tile_scheduler", "names": [ "vllm.vllm_flash_attn.cute.tile_scheduler.Params", "vllm.vllm_flash_attn.cute.tile_scheduler.ParamsBase", "vllm.vllm_flash_attn.cute.tile_scheduler.SingleTileLPTBwdScheduler", "vllm.vllm_flash_attn.cute.tile_scheduler.SingleTileLPTScheduler", "vllm.vllm_flash_attn.cute.tile_scheduler.SingleTileScheduler", "vllm.vllm_flash_attn.cute.tile_scheduler.SingleTileVarlenScheduler", "vllm.vllm_flash_attn.cute.tile_scheduler.StaticPersistentTileScheduler", "vllm.vllm_flash_attn.cute.tile_scheduler.TileSchedulerArguments", "vllm.vllm_flash_attn.cute.tile_scheduler.WorkTileInfo" ], "n_typable": 179, "n_typed": 54, "n_any": 0, "n_untyped": 125, "n_functions": 0, "n_function_overloads": 0, "n_function_params": 0, "n_methods": 55, "n_method_overloads": 55, "n_method_params": 119, "n_classes": 9, "n_attrs": 30, "n_properties": 0, "n_type_ignores": 0 }, { "path": "vllm/vllm_flash_attn/cute/utils.py", "symbol_reports": [ { "kind": "function", "name": "vllm.vllm_flash_attn.cute.utils.add_round_down", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.utils.fmax", "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.utils.ex2_emulation", "n_typed": 2, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.utils.warp_reduce", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.utils.ssa_to_scalar", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.utils.convert_from_dlpack_leading_static", "n_typed": 1, "n_any": 0, "n_untyped": 5, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.utils.atomic_add_fp32", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.utils.cvt_f16", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 2, "n_typable": 4, "n_params": 3, "n_function_overloads": 2, "n_function_params": 3 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.utils.shuffle_sync", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.utils.evaluate_polynomial_2", "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.utils.scalar_to_ssa", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.utils.cvt_f16x2_f32", "n_typed": 4, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 6, "n_params": 5, "n_function_overloads": 1, "n_function_params": 5 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.utils.fadd_reduce", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.utils.make_tiled_copy_A", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.utils.domain_offset_aligned", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.utils.canonical_warp_group_idx", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.utils.parse_swizzle_from_pointer", "n_typed": 2, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.utils.create_softcap_scoremod", "n_typed": 0, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 2, "n_params": 1, "n_function_overloads": 1, "n_function_params": 1 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.utils.warp_prefix_sum", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.utils.e2e_asm2", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.utils.hash_callable", "n_typed": 2, "n_any": 0, "n_untyped": 1, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.utils.fmax_reduce", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.utils.predicate_k", "n_typed": 3, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 3, "n_params": 2, "n_function_overloads": 1, "n_function_params": 2 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.utils.shr_u32", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.utils.combine_int_frac_ex2", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.utils.ex2_emulation_2", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.utils.evaluate_polynomial", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.utils.make_tiled_copy_B", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.utils.get_smem_store_atom", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.utils.convert_from_dlpack", "n_typed": 1, "n_any": 0, "n_untyped": 4, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.utils.mma_make_fragment_A", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.utils.elem_pointer", "n_typed": 3, "n_any": 0, "n_untyped": 2, "n_overloads": 1, "n_typable": 5, "n_params": 4, "n_function_overloads": 1, "n_function_params": 4 }, { "kind": "function", "name": "vllm.vllm_flash_attn.cute.utils.mma_make_fragment_B", "n_typed": 4, "n_any": 0, "n_untyped": 0, "n_overloads": 1, "n_typable": 4, "n_params": 3, "n_function_overloads": 1, "n_function_params": 3 } ], "type_ignores": [], "name": "vllm.vllm_flash_attn.cute.utils", "names": [ "vllm.vllm_flash_attn.cute.utils.add_round_down", "vllm.vllm_flash_attn.cute.utils.atomic_add_fp32", "vllm.vllm_flash_attn.cute.utils.canonical_warp_group_idx", "vllm.vllm_flash_attn.cute.utils.combine_int_frac_ex2", "vllm.vllm_flash_attn.cute.utils.convert_from_dlpack", "vllm.vllm_flash_attn.cute.utils.convert_from_dlpack_leading_static", "vllm.vllm_flash_attn.cute.utils.create_softcap_scoremod", "vllm.vllm_flash_attn.cute.utils.cvt_f16", "vllm.vllm_flash_attn.cute.utils.cvt_f16x2_f32", "vllm.vllm_flash_attn.cute.utils.domain_offset_aligned", "vllm.vllm_flash_attn.cute.utils.e2e_asm2", "vllm.vllm_flash_attn.cute.utils.elem_pointer", "vllm.vllm_flash_attn.cute.utils.evaluate_polynomial", "vllm.vllm_flash_attn.cute.utils.evaluate_polynomial_2", "vllm.vllm_flash_attn.cute.utils.ex2_emulation", "vllm.vllm_flash_attn.cute.utils.ex2_emulation_2", "vllm.vllm_flash_attn.cute.utils.fadd_reduce", "vllm.vllm_flash_attn.cute.utils.fmax", "vllm.vllm_flash_attn.cute.utils.fmax_reduce", "vllm.vllm_flash_attn.cute.utils.get_smem_store_atom", "vllm.vllm_flash_attn.cute.utils.hash_callable", "vllm.vllm_flash_attn.cute.utils.make_tiled_copy_A", "vllm.vllm_flash_attn.cute.utils.make_tiled_copy_B", "vllm.vllm_flash_attn.cute.utils.mma_make_fragment_A", "vllm.vllm_flash_attn.cute.utils.mma_make_fragment_B", "vllm.vllm_flash_attn.cute.utils.parse_swizzle_from_pointer", "vllm.vllm_flash_attn.cute.utils.predicate_k", "vllm.vllm_flash_attn.cute.utils.scalar_to_ssa", "vllm.vllm_flash_attn.cute.utils.shr_u32", "vllm.vllm_flash_attn.cute.utils.shuffle_sync", "vllm.vllm_flash_attn.cute.utils.ssa_to_scalar", "vllm.vllm_flash_attn.cute.utils.warp_prefix_sum", "vllm.vllm_flash_attn.cute.utils.warp_reduce" ], "n_typable": 138, "n_typed": 97, "n_any": 0, "n_untyped": 41, "n_functions": 33, "n_function_overloads": 34, "n_function_params": 105, "n_methods": 0, "n_method_overloads": 0, "n_method_params": 0, "n_classes": 0, "n_attrs": 0, "n_properties": 0, "n_type_ignores": 0 } ], "typecheckers": {}, "n_modules": 1264, "n_typable": 72507, "n_typed": 49485, "n_any": 333, "n_untyped": 22689, "n_functions": 2755, "n_function_overloads": 2798, "n_function_params": 9084, "n_methods": 13408, "n_method_params": 29905, "n_method_overloads": 13428, "n_classes": 3834, "n_attrs": 21235, "n_properties": 676, "type_ignores": [ { "kind": "type", "rules": null }, { "kind": "type", "rules": null }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "assignment" ] }, { "kind": "type", "rules": [ "assignment" ] }, { "kind": "type", "rules": [ "misc" ] }, { "kind": "type", "rules": [ "misc" ] }, { "kind": "type", "rules": [ "misc" ] }, { "kind": "type", "rules": [ "misc" ] }, { "kind": "type", "rules": null }, { "kind": "type", "rules": null }, { "kind": "type", "rules": null }, { "kind": "type", "rules": null }, { "kind": "type", "rules": null }, { "kind": "type", "rules": null }, { "kind": "type", "rules": [ "assignment" ] }, { "kind": "type", "rules": [ "import-not-found" ] }, { "kind": "type", "rules": [ "import-not-found" ] }, { "kind": "type", "rules": [ "no-redef" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "override" ] }, { "kind": "type", "rules": [ "override" ] }, { "kind": "type", "rules": [ "override" ] }, { "kind": "type", "rules": [ "assignment" ] }, { "kind": "type", "rules": [ "assignment" ] }, { "kind": "type", "rules": [ "assignment" ] }, { "kind": "type", "rules": [ "misc" ] }, { "kind": "type", "rules": [ "misc" ] }, { "kind": "type", "rules": [ "misc" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "assignment" ] }, { "kind": "type", "rules": [ "no-redef" ] }, { "kind": "type", "rules": [ "arg-type" ] }, { "kind": "type", "rules": [ "arg-type" ] }, { "kind": "type", "rules": [ "arg-type" ] }, { "kind": "type", "rules": [ "attr-defined" ] }, { "kind": "type", "rules": null }, { "kind": "type", "rules": [ "assignment" ] }, { "kind": "type", "rules": null }, { "kind": "type", "rules": null }, { "kind": "type", "rules": null }, { "kind": "type", "rules": null }, { "kind": "type", "rules": [ "misc" ] }, { "kind": "type", "rules": [ "misc" ] }, { "kind": "type", "rules": [ "assignment" ] }, { "kind": "type", "rules": [ "assignment" ] }, { "kind": "type", "rules": [ "type-var" ] }, { "kind": "type", "rules": [ "type-var" ] }, { "kind": "type", "rules": [ "type-var" ] }, { "kind": "type", "rules": [ "assignment" ] }, { "kind": "type", "rules": [ "assignment" ] }, { "kind": "type", "rules": null }, { "kind": "type", "rules": null }, { "kind": "type", "rules": null }, { "kind": "type", "rules": null }, { "kind": "type", "rules": null }, { "kind": "type", "rules": null }, { "kind": "type", "rules": null }, { "kind": "type", "rules": [ "override" ] }, { "kind": "type", "rules": [ "override" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "assignment" ] }, { "kind": "type", "rules": [ "assignment" ] }, { "kind": "type", "rules": [ "name-defined" ] }, { "kind": "type", "rules": [ "assignment", "misc" ] }, { "kind": "type", "rules": [ "misc" ] }, { "kind": "type", "rules": [ "assignment" ] }, { "kind": "type", "rules": [ "assignment" ] }, { "kind": "type", "rules": [ "no-redef" ] }, { "kind": "type", "rules": [ "misc", "no-redef" ] }, { "kind": "type", "rules": [ "misc" ] }, { "kind": "type", "rules": [ "misc" ] }, { "kind": "type", "rules": [ "no-redef" ] }, { "kind": "type", "rules": [ "assignment" ] }, { "kind": "type", "rules": [ "assignment" ] }, { "kind": "type", "rules": [ "assignment" ] }, { "kind": "type", "rules": [ "assignment" ] }, { "kind": "type", "rules": [ "assignment" ] }, { "kind": "type", "rules": [ "assignment" ] }, { "kind": "type", "rules": [ "no-redef" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "call-arg" ] }, { "kind": "type", "rules": [ "assignment" ] }, { "kind": "type", "rules": null }, { "kind": "type", "rules": [ "attr-defined" ] }, { "kind": "type", "rules": [ "attr-defined" ] } ], "n_type_ignores": 111 }